From 56be6b7daa7cde882dfc6883f595f824d4ab46ee Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Alexander=20Mei=C3=9Fner?= Date: Wed, 3 Jul 2024 13:46:39 +0200 Subject: [PATCH] Adds documentation for the VMs bytecode. --- docs/bytecode.md | 446 +++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 446 insertions(+) create mode 100644 docs/bytecode.md diff --git a/docs/bytecode.md b/docs/bytecode.md new file mode 100644 index 000000000..bf7e85c03 --- /dev/null +++ b/docs/bytecode.md @@ -0,0 +1,446 @@ +## Bytecode / ISA + +Registers +--------- + +The VM has 12 registers, including 10 general-purpose registers (GPRs). +All of them are 64 bit wide. + +| name | feature set | kind | Solana ABI | +|------:|:------------|:----------------|:-----------------------------------| +| `r0` | all | GPR | Return value | +| `r1` | all | GPR | Argument 0 | +| `r2` | all | GPR | Argument 1 | +| `r3` | all | GPR | Argument 2 | +| `r4` | all | GPR | Argument 3 | +| `r5` | all | GPR | Argument 4
or stack spill ptr | +| `r6` | all | GPR | Call-preserved | +| `r7` | all | GPR | Call-preserved | +| `r8` | all | GPR | Call-preserved | +| `r9` | all | GPR | Call-preserved | +| `r10` | all | Frame pointer | System register | +| `r11` | from v2 | Stack pointer | System register | +| `pc` | all | Program counter | Hidden register | + + +Instruction Layout +------------------ + +The bytecode is encoded in slots of 64 bits. +Instructions occupy either one or two slots, indicated by the opcode of the first slot. + +``` ++-------+--------+---------+---------+--------+-----------+ +| class | opcode | dst reg | src reg | offset | immediate | +| 0..2 | 3..7 | 8..11 | 12..15 | 16..31 | 32..63 | Bits ++-------+--------+---------+---------+--------+-----------+ +low byte high byte +``` + +bit index | meaning +--- | --- +2..0 | instruction class +7..3 | operation code +11..8 | destination register +15..12 | source register +31..16 | offset +63..32 | immediate + + +Class and Operation Codes +------------------------- + +| | ·0 | ·1 | ·2 | ·3 | ·4 | ·5 | ·6 | ·7 | ·8 | ·9 | ·A | ·B | ·C | ·D | ·E | ·F | +|----:|:----:|:----:|:---:|:----:|:------:|:----:|:-------:|:------:|:----:|:-----:|:----:|:-----:|:------:|:-----:|:-------:|:------:| +| 0· | lddw | - | - | - | add32 | ja | - | add64 | - | - | - | - | add32 | - | - | add64 | +| 1· | - | - | - | - | sub32 | jeq | - | sub64 | lddw | - | - | - | sub32 | jeq | - | sub64 | +| 2· | - | - | - | - | mul32 | jgt | - | mul64 | - | - | - | - | mul32 | jgt | - | mul64 | +| 3· | - | - | - | - | div32 | jge | uhmul64 | div64 | - | - | - | - | div32 | jge | uhmul64 | div64 | +| 4· | - | - | - | - | or32 | jset | udiv32 | or64 | - | - | - | - | or32 | jset | udiv32 | or64 | +| 5· | - | - | - | - | and32 | jne | udiv64 | and64 | - | - | - | - | and32 | jne | udiv64 | and64 | +| 6· | - | ldxw | stw | stxw | lsh32 | jsgt | urem32 | lsh64 | - | ldxh | sth | stxh | lsh32 | jsgt | urem32 | lsh64 | +| 7· | - | ldxb | stb | stxb | rsh32 | jsge | urem64 | rsh64 | - | ldxdw | stdw | stxdw | rsh32 | jsge | urem64 | rsh64 | +| 8· | - | - | - | - | neg32 | call | lmul32 | neg64 | - | - | - | - | - | callx | lmul32 | - | +| 9· | - | - | - | - | mod32 | exit | lmul64 | mod64 | - | - | - | - | mod32 | - | lmul64 | mod64 | +| A· | - | - | - | - | xor32 | jlt | - | xor64 | - | - | - | - | xor32 | jlt | - | xor64 | +| B· | - | - | - | - | mov32 | jle | shmul64 | mov64 | - | - | - | - | mov32 | jle | shmul64 | mov64 | +| C· | - | - | - | - | arsh32 | jslt | sdiv32 | arsh64 | - | - | - | - | arsh32 | jslt | sdiv32 | arsh64 | +| D· | - | - | - | - | le | jsle | sdiv64 | - | - | - | - | - | be | jsle | sdiv64 | - | +| E· | - | - | - | - | - | - | srem32 | - | - | - | - | - | - | - | srem32 | - | +| F· | - | - | - | - | - | - | srem64 | hor64 | - | - | - | - | - | - | srem64 | - | + + +Instructions by Class +--------------------- + +The following Rust equivalents assume that: +- `src` and `dst` registers are `u64` +- `imm` is `u32` +- `off` is `u16` + +### 32 bit Arithmetic and Logic +opcode (hex / bin) | feature set | assembler mnemonic | Rust equivalent +------------------ | ----------- | ------------------ | --------------- +`04` / `00000100` | until v2 | `add32 dst, imm` | `dst = (dst as u32).wrapping_add(imm) as i32 as i64 as u64` +`04` / `00000100` | from v2 | `add32 dst, imm` | `dst = (dst as u32).wrapping_add(imm) as u64` +`0C` / `00001100` | until v2 | `add32 dst, src` | `dst = (dst as u32).wrapping_add(src as u32) as i32 as i64 as u64` +`0C` / `00001100` | from v2 | `add32 dst, src` | `dst = (dst as u32).wrapping_add(src as u32) as u64` +`14` / `00010100` | until v2 | `sub32 dst, imm` | `dst = (dst as u32).wrapping_sub(imm) as u64` +`14` / `00010100` | from v2 | `sub32 dst, imm` | `dst = imm.wrapping_sub(dst as u32) as u64` +`1C` / `00011100` | all | `sub32 dst, src` | `dst = (dst as u32).wrapping_sub(src as u32) as u64` +`24` / `00100100` | until v2 | `mul32 dst, imm` | `dst = (dst as i32).wrapping_mul(imm as i32) as i64 as u64` +`2C` / `00101100` | until v2 | `mul32 dst, src` | `dst = (dst as i32).wrapping_mul(src as i32) as i64 as u64` +`34` / `00110100` | until v2 | `div32 dst, imm` | `dst = ((dst as u32) / imm) as u64` +`3C` / `00111100` | until v2 | `div32 dst, src` | `dst = ((dst as u32) / (src as u32)) as u64` +`44` / `01000100` | all | `or32 dst, imm` | `dst = (dst as u32).or(imm) as u64` +`4C` / `01001100` | all | `or32 dst, src` | `dst = (dst as u32).or(src as u32) as u64` +`54` / `01010100` | all | `and32 dst, imm` | `dst = (dst as u32).and(imm) as u64` +`5C` / `01011100` | all | `and32 dst, src` | `dst = (dst as u32).and(src as u32) as u64` +`64` / `01100100` | all | `lsh32 dst, imm` | `dst = (dst as u32).wrapping_shl(imm) as u64` +`6C` / `01101100` | all | `lsh32 dst, src` | `dst = (dst as u32).wrapping_shl(src as u32) as u64` +`74` / `01110100` | all | `rsh32 dst, imm` | `dst = (dst as u32).wrapping_shr(imm) as u64` +`7C` / `01111100` | all | `rsh32 dst, src` | `dst = (dst as u32).wrapping_shr(src as u32) as u64` +`84` / `10000100` | until v2 | `neg32 dst` | `dst = (dst as i32).wrapping_neg() as u32 as u64` +`8C` / `10001100` | | -- reserved -- +`94` / `10010100` | until v2 | `mod32 dst, imm` | `dst = ((dst as u32) % imm) as u64` +`9C` / `10011100` | until v2 | `mod32 dst, src` | `dst = ((dst as u32) % (src as u32)) as u64` +`A4` / `10100100` | all | `xor32 dst, imm` | `dst = (dst as u32).xor(imm) as u64` +`AC` / `10101100` | all | `xor32 dst, src` | `dst = (dst as u32).xor(src as u32) as u64` +`B4` / `10110100` | all | `mov32 dst, imm` | `dst = imm as i32 as i64 as u64` +`BC` / `10111100` | until v2 | `mov32 dst, src` | `dst = src as u32 as u64` +`BC` / `10111100` | from v2 | `mov32 dst, src` | `dst = src as i32 as i64 as u64` +`C4` / `11000100` | all | `ash32 dst, imm` | `dst = (dst as i32).wrapping_shr(imm) as u32 as u64` +`CC` / `11001100` | all | `ash32 dst, src` | `dst = (dst as i32).wrapping_shr(src as u32) as u32 as u64` +`D4` / `11010100` | until v2 | `le dst, imm=16/32/64` +`DC` / `11011100` | all | `be dst, imm=16/32/64` +`E4` / `11100100` | | -- reserved -- +`EC` / `11101100` | | -- reserved -- +`F4` / `11110100` | | -- reserved -- +`FC` / `11111100` | | -- reserved -- + +### 64 bit Arithmetic and Logic +opcode (hex / bin) | feature set | assembler mnemonic | Rust equivalent +------------------ | ----------- | ------------------ | --------------- +`07` / `00000111` | all | `add64 dst, imm` | `dst = dst.wrapping_add(imm as i32 as i64 as u64)` +`0F` / `00001111` | all | `add64 dst, src` | `dst = dst.wrapping_add(src)` +`17` / `00010111` | until v2 | `sub64 dst, imm` | `dst = dst.wrapping_sub(imm as i32 as i64 as u64)` +`17` / `00010111` | from v2 | `sub64 dst, imm` | `dst = (imm as i32 as i64 as u64).wrapping_sub(dst)` +`1F` / `00011111` | all | `sub64 dst, src` | `dst = dst.wrapping_sub(src)` +`27` / `00100111` | until v2 | `mul64 dst, imm` | `dst = dst.wrapping_mul(imm as u64)` +`2F` / `00101111` | until v2 | `mul64 dst, src` | `dst = dst.wrapping_mul(src)` +`37` / `00110111` | until v2 | `div64 dst, imm` | `dst = dst / (imm as u64)` +`3F` / `00111111` | until v2 | `div64 dst, src` | `dst = dst / src` +`47` / `01000111` | all | `or64 dst, imm` | `dst = dst.or(imm)` +`4F` / `01001111` | all | `or64 dst, src` | `dst = dst.or(src)` +`57` / `01010111` | all | `and64 dst, imm` | `dst = dst.and(imm)` +`5F` / `01011111` | all | `and64 dst, src` | `dst = dst.and(src)` +`67` / `01100111` | all | `lsh64 dst, imm` | `dst = dst.wrapping_shl(imm)` +`6F` / `01101111` | all | `lsh64 dst, src` | `dst = dst.wrapping_shl(src as u32)` +`77` / `01110111` | all | `rsh64 dst, imm` | `dst = dst.wrapping_shr(imm)` +`7F` / `01111111` | all | `rsh64 dst, src` | `dst = dst.wrapping_shr(src as u32)` +`87` / `10000111` | until v2 | `neg64 dst` | `dst = (dst as i64).wrapping_neg() as u64` +`8F` / `10001111` | | -- reserved -- +`97` / `10010111` | until v2 | `mod64 dst, imm` | `dst = dst % (imm as u64)` +`9F` / `10011111` | until v2 | `mod64 dst, src` | `dst = dst % src` +`A7` / `10100111` | all | `xor64 dst, imm` | `dst = dst.xor(imm)` +`AF` / `10101111` | all | `xor64 dst, src` | `dst = dst.xor(src)` +`B7` / `10110111` | all | `mov64 dst, imm` | `dst = imm as u64` +`BF` / `10111111` | all | `mov64 dst, src` | `dst = src` +`C7` / `11000111` | all | `ash64 dst, imm` | `dst = (dst as i64).wrapping_shr(imm)` +`CF` / `11001111` | all | `ash64 dst, src` | `dst = (dst as i64).wrapping_shr(src as u32)` +`D7` / `11010111` | | -- reserved -- +`DF` / `11011111` | | -- reserved -- +`E7` / `11100111` | | -- reserved -- +`EF` / `11101111` | | -- reserved -- +`F7` / `11110111` | from v2 | `hor64 dst, imm` | `dst = dst.or((imm as u64).wrapping_shl(32))` +`FF` / `11111111` | | -- reserved -- + +### Product / Quotient / Remainder +bit index | when `0` | when `1` +--- | --- | --- +3 | immediate | register +4 | 32 bit | 64 bit +5 | low product / quotient | high product / remainder +6 | multiplication | division +7 | unsigned | signed + +#### Panics +- Division by zero: `if src == 0` +- Negative overflow: `if src == -1 && dst == u64::MIN` + +opcode (hex / bin) | feature set | assembler mnemonic | Rust equivalent +------------------ | ----------- | ------------------ | --------------- +`06` / `00000110` | | -- reserved -- +`0E` / `00001110` | | -- reserved -- +`16` / `00010110` | | -- reserved -- +`1E` / `00011110` | | -- reserved -- +`26` / `00100110` | | -- reserved -- +`2E` / `00101110` | | -- reserved -- +`36` / `00110110` | from v2 | `uhmul64 dst, imm` | `dst = (dst as u128).wrapping_mul(imm as u128).wrapping_shr(64) as u64` +`3E` / `00111110` | from v2 | `uhmul64 dst, src` | `dst = (dst as u128).wrapping_mul(src as u128).wrapping_shr(64) as u64` +`46` / `01000110` | from v2 | `udiv32 dst, imm` | `dst = ((dst as u32) / imm) as u64` +`4E` / `01001110` | from v2 | `udiv32 dst, src` | `dst = ((dst as u32) / (src as u32)) as u64` +`56` / `01010110` | from v2 | `udiv64 dst, imm` | `dst = dst / (imm as u64)` +`5E` / `01011110` | from v2 | `udiv64 dst, src` | `dst = dst / src` +`66` / `01100110` | from v2 | `urem32 dst, imm` | `dst = ((dst as u32) % imm) as u64` +`6E` / `01101110` | from v2 | `urem32 dst, src` | `dst = ((dst as u32) % (src as u32)) as u64` +`76` / `01110110` | from v2 | `urem64 dst, imm` | `dst = dst % (imm as u64)` +`7E` / `01111110` | from v2 | `urem64 dst, src` | `dst = dst % src` +`86` / `10000110` | from v2 | `lmul32 dst, imm` | `dst = (dst as i32).wrapping_mul(imm as i32) as u32 as u64` +`8E` / `10001110` | from v2 | `lmul32 dst, src` | `dst = (dst as i32).wrapping_mul(src as i32) as u32 as u64` +`96` / `10010110` | from v2 | `lmul64 dst, imm` | `dst = dst.wrapping_mul(imm as u64)` +`9E` / `10011110` | from v2 | `lmul64 dst, src` | `dst = dst.wrapping_mul(src)` +`A6` / `10100110` | | -- reserved -- +`AE` / `10101110` | | -- reserved -- +`B6` / `10110110` | from v2 | `shmul64 dst, imm` | `dst = (dst as i128).wrapping_mul(imm as i32 as i128).wrapping_shr(64) as i64 as u64` +`BE` / `10111110` | from v2 | `shmul64 dst, src` | `dst = (dst as i128).wrapping_mul(src as i64 as i128).wrapping_shr(64) as i64 as u64` +`C6` / `11000110` | from v2 | `sdiv32 dst, imm` | `dst = ((dst as i32) / (imm as i32)) as u32 as u64` +`CE` / `11001110` | from v2 | `sdiv32 dst, src` | `dst = ((dst as i32) / (src as i32)) as u32 as u64` +`D6` / `11010110` | from v2 | `sdiv64 dst, imm` | `dst = ((dst as i64) / (imm as i64)) as u64` +`DE` / `11011110` | from v2 | `sdiv64 dst, src` | `dst = ((dst as i64) / (src as i64)) as u64` +`E6` / `11100110` | from v2 | `srem32 dst, imm` | `dst = ((dst as i32) % (imm as i32)) as u32 as u64` +`EE` / `11101110` | from v2 | `srem32 dst, src` | `dst = ((dst as i32) % (src as i32)) as u32 as u64` +`F6` / `11110110` | from v2 | `srem64 dst, imm` | `dst = ((dst as i64) % (imm as i64)) as u64` +`FE` / `11111110` | from v2 | `srem64 dst, src` | `dst = ((dst as i64) % (src as i64)) as u64` + +### Memory + +#### Panics +- Out of bounds: When the memory location is not mapped. +- Access violation: When a store to a readonly region happens. + +opcode (hex / bin) | feature set | assembler mnemonic | Rust equivalent +------------------ | ----------- | ------------------ | --------------- +`00` / `00000000` | until v2 | `lddw dst, imm` | `dst = dst.or((imm as u64).wrapping_shl(32))` +`08` / `00001000` | | -- reserved -- +`10` / `00010000` | | -- reserved -- +`18` / `00011000` | until v2 | `lddw dst, imm` | `dst = imm as u64` +`20` / `00100000` | | -- reserved -- +`28` / `00101000` | | -- reserved -- +`30` / `00110000` | | -- reserved -- +`38` / `00111000` | | -- reserved -- +`40` / `01000000` | | -- reserved -- +`48` / `01001000` | | -- reserved -- +`50` / `01010000` | | -- reserved -- +`58` / `01011000` | | -- reserved -- +`60` / `01100000` | | -- reserved -- +`68` / `01101000` | | -- reserved -- +`70` / `01110000` | | -- reserved -- +`78` / `01111000` | | -- reserved -- +`80` / `10000000` | | -- reserved -- +`88` / `10001000` | | -- reserved -- +`90` / `10010000` | | -- reserved -- +`98` / `10011000` | | -- reserved -- +`A0` / `10100000` | | -- reserved -- +`A8` / `10101000` | | -- reserved -- +`B0` / `10110000` | | -- reserved -- +`B8` / `10111000` | | -- reserved -- +`C0` / `11000000` | | -- reserved -- +`C8` / `11001000` | | -- reserved -- +`D0` / `11010000` | | -- reserved -- +`D8` / `11011000` | | -- reserved -- +`E0` / `11100000` | | -- reserved -- +`E8` / `11101000` | | -- reserved -- +`F0` / `11110000` | | -- reserved -- +`F8` / `11111000` | | -- reserved -- + +opcode (hex / bin) | feature set | assembler mnemonic +------------------ | ----------- | ------------------ +`01` / `00000001` | | -- reserved -- +`09` / `00001001` | | -- reserved -- +`11` / `00010001` | | -- reserved -- +`19` / `00011001` | | -- reserved -- +`21` / `00100001` | | -- reserved -- +`29` / `00101001` | | -- reserved -- +`31` / `00110001` | | -- reserved -- +`39` / `00111001` | | -- reserved -- +`41` / `01000001` | | -- reserved -- +`49` / `01001001` | | -- reserved -- +`51` / `01010001` | | -- reserved -- +`59` / `01011001` | | -- reserved -- +`61` / `01100001` | all | `ldxw dst, [src + off]` +`69` / `01101001` | all | `ldxh dst, [src + off]` +`71` / `01110001` | all | `ldxb dst, [src + off]` +`79` / `01111001` | all | `ldxdw dst, [src + off]` +`81` / `10000001` | | -- reserved -- +`89` / `10001001` | | -- reserved -- +`91` / `10010001` | | -- reserved -- +`99` / `10011001` | | -- reserved -- +`A1` / `10100001` | | -- reserved -- +`A9` / `10101001` | | -- reserved -- +`B1` / `10110001` | | -- reserved -- +`B9` / `10111001` | | -- reserved -- +`C1` / `11000001` | | -- reserved -- +`C9` / `11001001` | | -- reserved -- +`D1` / `11010001` | | -- reserved -- +`D9` / `11011001` | | -- reserved -- +`E1` / `11100001` | | -- reserved -- +`E9` / `11101001` | | -- reserved -- +`F1` / `11110001` | | -- reserved -- +`F9` / `11111001` | | -- reserved -- + +opcode (hex / bin) | feature set | assembler mnemonic +------------------ | ----------- | ------------------ +`02` / `00000010` | | -- reserved -- +`0A` / `00001010` | | -- reserved -- +`12` / `00010010` | | -- reserved -- +`1A` / `00011010` | | -- reserved -- +`22` / `00100010` | | -- reserved -- +`2A` / `00101010` | | -- reserved -- +`32` / `00110010` | | -- reserved -- +`3A` / `00111010` | | -- reserved -- +`42` / `01000010` | | -- reserved -- +`4A` / `01001010` | | -- reserved -- +`52` / `01010010` | | -- reserved -- +`5A` / `01011010` | | -- reserved -- +`62` / `01100010` | all | `stw [dst + off], imm` +`6A` / `01101010` | all | `sth [dst + off], imm` +`72` / `01110010` | all | `stb [dst + off], imm` +`7A` / `01111010` | all | `stdw [dst + off], imm` +`82` / `10000010` | | -- reserved -- +`8A` / `10001010` | | -- reserved -- +`92` / `10010010` | | -- reserved -- +`9A` / `10011010` | | -- reserved -- +`A2` / `10100010` | | -- reserved -- +`AA` / `10101010` | | -- reserved -- +`B2` / `10110010` | | -- reserved -- +`BA` / `10111010` | | -- reserved -- +`C2` / `11000010` | | -- reserved -- +`CA` / `11001010` | | -- reserved -- +`D2` / `11010010` | | -- reserved -- +`DA` / `11011010` | | -- reserved -- +`E2` / `11100010` | | -- reserved -- +`EA` / `11101010` | | -- reserved -- +`F2` / `11110010` | | -- reserved -- +`FA` / `11111010` | | -- reserved -- + +opcode (hex / bin) | feature set | assembler mnemonic +------------------ | ----------- | ------------------ +`03` / `00000011` | | -- reserved -- +`0B` / `00001011` | | -- reserved -- +`13` / `00010011` | | -- reserved -- +`1B` / `00011011` | | -- reserved -- +`23` / `00100011` | | -- reserved -- +`2B` / `00101011` | | -- reserved -- +`33` / `00110011` | | -- reserved -- +`3B` / `00111011` | | -- reserved -- +`43` / `01000011` | | -- reserved -- +`4B` / `01001011` | | -- reserved -- +`53` / `01010011` | | -- reserved -- +`5B` / `01011011` | | -- reserved -- +`63` / `01100011` | all | `stxw [dst + off], src` +`6B` / `01101011` | all | `stxh [dst + off], src` +`73` / `01110011` | all | `stxb [dst + off], src` +`7B` / `01111011` | all | `stxdw [dst + off], src` +`83` / `10000011` | | -- reserved -- +`8B` / `10001011` | | -- reserved -- +`93` / `10010011` | | -- reserved -- +`9B` / `10011011` | | -- reserved -- +`A3` / `10100011` | | -- reserved -- +`AB` / `10101011` | | -- reserved -- +`B3` / `10110011` | | -- reserved -- +`BB` / `10111011` | | -- reserved -- +`C3` / `11000011` | | -- reserved -- +`CB` / `11001011` | | -- reserved -- +`D3` / `11010011` | | -- reserved -- +`DB` / `11011011` | | -- reserved -- +`E3` / `11100011` | | -- reserved -- +`EB` / `11101011` | | -- reserved -- +`F3` / `11110011` | | -- reserved -- +`FB` / `11111011` | | -- reserved -- + +### Control Flow + +The target location is the end of the current instruction offsetted by the signed `off` field. + +Call instructions (`call` and `callx` but not `syscall`) do: +- Save the registers `r6`, `r7`, `r8`, `r9` and the frame pointer `r10` +- If ≤ v1: Add one stack frame size to the frame pointer `r10` +- If ≥ v2: Move the stack pointer `r11` into the frame pointer `r10` + +The `exit` (a.k.a. return) instruction does: +- Restore the registers `r6`, `r7`, `r8`, `r9` and the frame pointer `r10` +- Or gracefully terminate the program if there is no stack frame to restore + +#### Panics +- Out of bounds: When the target location is outside the bytecode if ≤ v1. +- Out of bounds: When the target location is outside the current function if ≥ v2 and a jump. +- Out of bounds: When the target location is not a registered function if ≥ v2 and a call. +- Second slot of `lddw`: When the target location has opcode `0x00`. +- Stack overflow: When one too many nested call happens. + +opcode (hex / bin) | feature set | assembler mnemonic | condition Rust equivalent +------------------ | ----------- | -------------------- | ------------------------- +`05` / `00000101` | all | `ja off` | `true` +`0D` / `00001101` | | -- reserved -- +`15` / `00010101` | all | `jeq dst, imm, off` | `dst == (imm as i32 as i64 as u64)` +`1D` / `00011101` | all | `jeq dst, src, off` | `dst == src` +`25` / `00100101` | all | `jgt dst, imm, off` | `dst > (imm as i32 as i64 as u64)` +`2D` / `00101101` | all | `jgt dst, src, off` | `dst > src` +`35` / `00110101` | all | `jge dst, imm, off` | `dst >= (imm as i32 as i64 as u64)` +`3D` / `00111101` | all | `jge dst, src, off` | `dst >= src` +`45` / `01000101` | all | `jset dst, imm, off` | `dst.and(imm as i32 as i64 as u64) != 0` +`4D` / `01001101` | all | `jset dst, src, off` | `dst.and(src) != 0` +`55` / `01010101` | all | `jne dst, imm, off` | `dst != (imm as i32 as i64 as u64)` +`5D` / `01011101` | all | `jne dst, src, off` | `dst != src` +`65` / `01100101` | all | `jsgt dst, imm, off` | `(dst as i64) > (imm as i32 as i64)` +`6D` / `01101101` | all | `jsgt dst, src, off` | `(dst as i64) > (src as i64)` +`75` / `01110101` | all | `jsge dst, imm, off` | `(dst as i64) >= (imm as i32 as i64)` +`7D` / `01111101` | all | `jsge dst, src, off` | `(dst as i64) >= (src as i64)` +`85` / `10000101` | until v2 | `call off` +`85` / `10000101` | from v2 | `syscall src=0, off` +`85` / `10000101` | from v2 | `call src=1, off` +`8D` / `10001101` | until v2 | `callx imm` +`8D` / `10001101` | from v2 | `callx src` +`95` / `10010101` | all | `exit` +`9D` / `10011101` | | -- reserved -- +`A5` / `10100101` | all | `jlt dst, imm, off` | `dst < imm as i32 as i64 as u64` +`AD` / `10101101` | all | `jlt dst, src, off` | `dst < src` +`B5` / `10110101` | all | `jle dst, imm, off` | `dst <= imm as i32 as i64 as u64` +`BD` / `10111101` | all | `jle dst, src, off` | `dst <= src` +`C5` / `11000101` | all | `jslt dst, imm, off` | `(dst as i64) < (imm as i32 as i64)` +`CD` / `11001101` | all | `jslt dst, src, off` | `(dst as i64) < (src as i64)` +`D5` / `11010101` | all | `jsle dst, imm, off` | `(dst as i64) <= (imm as i32 as i64)` +`DD` / `11011101` | all | `jsle dst, src, off` | `(dst as i64) <= (src as i64)` +`E5` / `11100101` | | -- reserved -- +`ED` / `11101101` | | -- reserved -- +`F5` / `11110101` | | -- reserved -- +`FD` / `11111101` | | -- reserved -- + + +Verification +------------ + +### all +- The bytecode must be divisible by the instruction slot size (64 bits / 8 bytes) +- The bytecode must contain at least one instruction +- `lddw` (opcode `0x18`) is two slots long and must be followed by a slot with opcode `0x00` +- Immediate values of quotient and remainder instructions must be imm ≠ 0 +- Immediate values of 32 bit shift instructions must be 0 ≤ imm < 32 +- Immediate values of 64 bit shift instructions must be 0 ≤ imm < 64 +- Immediate values of byte swap instructions (`le` and `be`) must be 16, 32 or 64 +- The offset of jump instructions must not point to the second slot of a `lddw` instruction (opcode `0x00`) +- `callx` must not use r10 as source register +- For all instructions the source register must be `r0` ≤ src ≤ `r10` +- For all instructions (except for memory writes) the destination register must be `r0` ≤ dst ≤ `r9` +- For all instructions the opcode must be valid +- Memory write instructions can use `r10` as destination register + +### until v2 +- Opcodes from the product / quotient / remainder instruction class are forbiden +- `le` is allowed +- `callx` source register is encoded in the imm field +- The targets of `call` instructions is checked at runtime not verification time +- The offset of jump instructions must be limited to the range of the bytecode + +### from v2 +- Every function must end in a `ja` or `exit` instruction +- `lddw` (opcodes `0x18` and `0x00`) are forbidden +- `neg32` and `neg64` are forbidden +- Opcodes from the product / quotient / remainder instruction class are allowed +- `le` is forbidden +- `hor64` is allowed +- The offset of jump instructions must be limited to the range of the current function +- `callx` source register is encoded in the src field +- The targets of syscalls (`call` instructions with src ≠ 0) must have been registered at verification time +- `add64 reg, imm` can use `r11` as destination register