312 lines
13 KiB
NASM
Raw Normal View History

2022-07-22 14:35:41 -07:00
// Copies a message from the stack into the kernel general segment, then
// continues into sha2_pad.
// Pre stack:  num_bytes, x[0], x[1], ..., x[num_bytes - 1], retdest
// Memory:     address 0 <- num_bytes, address i + 1 <- x[i]
// Post stack: retdest (on entry to sha2_pad)
global sha2_store:
    JUMPDEST
    // stack: num_bytes, x[0], x[1], ..., x[num_bytes - 1], retdest
    dup1
    // stack: num_bytes, num_bytes, x[0], x[1], ..., x[num_bytes - 1], retdest
    push 0
    // stack: addr=0, num_bytes, num_bytes, x[0], x[1], ..., x[num_bytes - 1], retdest
    %mstore_kernel_general
    // stack: num_bytes, x[0], x[1], ..., x[num_bytes - 1], retdest
    push 1
    swap1
    // stack: counter=num_bytes, addr=1, x[0], x[1], ..., x[num_bytes - 1], retdest
    dup1
    iszero
    // Empty message: the loop body stores one item before it tests the counter,
    // so entering it with counter=0 would consume retdest as if it were x[0]
    // and the counter would never reach zero. Skip straight to the end, which
    // expects exactly this layout (counter=0, addr, retdest).
    %jumpi(sha2_store_end)
    // stack: counter=num_bytes, addr=1, x[0], x[1], ..., x[num_bytes - 1], retdest
    swap1
    // stack: addr=1, counter=num_bytes, x[0], x[1], ..., x[num_bytes - 1], retdest
sha2_store_loop:
    JUMPDEST
    // stack: addr, counter, x[num_bytes-counter], ... , x[num_bytes-1], retdest
    dup1
    // stack: addr, addr, counter, x[num_bytes-counter], ... , x[num_bytes-1], retdest
    swap3
    // stack: x[num_bytes-counter], addr, counter, addr, ... , x[num_bytes-1], retdest
    swap1
    // stack: addr, x[num_bytes-counter], counter, addr, ... , x[num_bytes-1], retdest
    %mstore_kernel_general
    // stack: counter, addr, ... , x[num_bytes-1], retdest
    %decrement
    // stack: counter-1, addr, ... , x[num_bytes-1], retdest
    dup1
    // stack: counter-1, counter-1, addr, ... , x[num_bytes-1], retdest
    iszero
    %jumpi(sha2_store_end)
    // stack: counter-1, addr, ... , x[num_bytes-1], retdest
    swap1
    // stack: addr, counter-1, ... , x[num_bytes-1], retdest
    %increment
    // stack: addr+1, counter-1, ... , x[num_bytes-1], retdest
    %jump(sha2_store_loop)
sha2_store_end:
    JUMPDEST
    // stack: counter=0, addr, retdest
    %pop2
    // stack: retdest
    // Instead of returning to retdest (the JUMP below is commented out), control
    // continues into the padding step with retdest still on the stack.
    //JUMP
    %jump(sha2_pad)
2022-08-01 16:36:36 -07:00
2022-07-22 14:35:41 -07:00
// Precondition: input is in memory, starting at 0 of kernel general segment, of the form
//     num_bytes, x[0], x[1], ..., x[num_bytes - 1]
//     (so x[i] lives at address i + 1)
// Postcondition: output is in memory, starting at 0, of the form
//     num_blocks, block0[0], ..., block0[63], block1[0], ..., blocklast[63]
// NOTE(review): only the 0x80 byte and the length field are written here; the
// padding bytes in between are presumably already zero -- confirm with callers.
global sha2_pad:
    JUMPDEST
    // stack: retdest
    push 0
    %mload_kernel_general
    // stack: num_bytes, retdest
    // STEP 1: append the single 1 bit
    // Write 128 (= 1 << 7) to the byte right after the message. Address 0 holds
    // num_bytes, so that byte is at address num_bytes + 1; writing to address
    // num_bytes would overwrite x[num_bytes - 1].
    // The constant is pushed directly so this does not depend on SHL operand order.
    push 128
    // stack: 128, num_bytes, retdest
    dup2
    // stack: num_bytes, 128, num_bytes, retdest
    %increment
    // stack: num_bytes + 1, 128, num_bytes, retdest
    %mstore_kernel_general
    // stack: num_bytes, retdest
    // STEP 2: calculate num_blocks := (num_bytes+8)//64 + 1
    // (room for the message, the 0x80 byte and the 8-byte length)
    dup1
    // stack: num_bytes, num_bytes, retdest
    %add_const(8)
    %div_const(64)
    %increment
    // stack: num_blocks = (num_bytes+8)//64 + 1, num_bytes, retdest
    // STEP 3: calculate length := num_bytes*8 (message length in bits)
    swap1
    // stack: num_bytes, num_blocks, retdest
    push 8
    mul
    // stack: length = num_bytes*8, num_blocks, retdest
    // STEP 4: write length into the last 8 bytes of the final block
    // Blocks start at address 1, so the final block ends at address num_blocks*64.
    // NOTE(review): assumes %sha2_write_length treats last_addr as the address of
    // the last (least significant) length byte -- confirm against the macro.
    dup2
    // stack: num_blocks, length, num_blocks, retdest
    push 64
    mul
    // stack: last_addr = num_blocks*64, length, num_blocks, retdest
    %sha2_write_length
    // stack: num_blocks, retdest
    // STEP 5: write num_blocks to address 0 (replacing num_bytes)
    push 0
    %mstore_kernel_general
    // stack: retdest
    // Instead of returning to retdest (the JUMP below is commented out), control
    // continues into message schedule generation for the first block, with
    // block_addr = 1 and output_addr = 100.
    //JUMP
    push 100
    push 1
    // stack: block_addr=1, output_addr=100, retdest
    %jump(sha2_gen_message_schedule_from_block)
2022-07-18 16:12:28 -07:00
// Precondition: stack contains address of one message block, followed by output address
// Postcondition: 256 bytes starting at given output address contain the 64 32-bit chunks
//     of message schedule (in four-byte increments)
//
// The first 16 chunks are split out of the two 256-bit halves of the block;
// the remaining 48 are derived as
//     w[t] = sigma_1(w[t-2]) + w[t-7] + sigma_0(w[t-15]) + w[t-16]   (mod 2^32)
//
// The constant 2^32 = 4294967296 is pushed directly instead of being computed
// with SHL, so the code does not depend on SHL operand order.
//
// NOTE(review): each splitting loop stores the LOW 32 bits of its half first, at
// increasing addresses. If %mload_kernel_general_u256 loads big-endian, this
// writes the eight chunks of each half in reverse order -- confirm.
global sha2_gen_message_schedule_from_block:
    JUMPDEST
    // stack: block_addr, output_addr, retdest
    dup1
    // stack: block_addr, block_addr, output_addr, retdest
    %add_const(32)
    // stack: block_addr + 32, block_addr, output_addr, retdest
    swap1
    // stack: block_addr, block_addr + 32, output_addr, retdest
    %mload_kernel_general_u256
    // stack: block[0], block_addr + 32, output_addr, retdest
    swap1
    // stack: block_addr + 32, block[0], output_addr, retdest
    %mload_kernel_general_u256
    // stack: block[1], block[0], output_addr, retdest
    swap2
    // stack: output_addr, block[0], block[1], retdest
    push 8
    // stack: counter=8, output_addr, block[0], block[1], retdest
    // Falls through into the first splitting loop.
sha2_gen_message_schedule_from_block_0_loop:
    JUMPDEST
    // stack: counter, output_addr, block[0], block[1], retdest
    swap2
    // stack: block[0], output_addr, counter, block[1], retdest
    push 4294967296
    // stack: 1 << 32, block[0], output_addr, counter, block[1], retdest
    dup2
    dup2
    // stack: 1 << 32, block[0], 1 << 32, block[0], output_addr, counter, block[1], retdest
    swap1
    // stack: block[0], 1 << 32, 1 << 32, block[0], output_addr, counter, block[1], retdest
    mod
    // stack: block[0] % (1 << 32), 1 << 32, block[0], output_addr, counter, block[1], retdest
    swap2
    // stack: block[0], 1 << 32, block[0] % (1 << 32), output_addr, counter, block[1], retdest
    div
    // stack: block[0] // (1 << 32), block[0] % (1 << 32), output_addr, counter, block[1], retdest
    swap1
    // stack: block[0] % (1 << 32), block[0] // (1 << 32), output_addr, counter, block[1], retdest
    dup3
    // stack: output_addr, block[0] % (1 << 32), block[0] // (1 << 32), output_addr, counter, block[1], retdest
    %mstore_kernel_general_u32
    // stack: block[0] // (1 << 32), output_addr, counter, block[1], retdest
    swap1
    // stack: output_addr, block[0] // (1 << 32), counter, block[1], retdest
    %add_const(4)
    // stack: output_addr + 4, block[0] // (1 << 32), counter, block[1], retdest
    swap1
    // stack: block[0] // (1 << 32), output_addr + 4, counter, block[1], retdest
    swap2
    // stack: counter, output_addr + 4, block[0] // (1 << 32), block[1], retdest
    %decrement
    dup1
    iszero
    %jumpi(sha2_gen_message_schedule_from_block_0_end)
    %jump(sha2_gen_message_schedule_from_block_0_loop)
sha2_gen_message_schedule_from_block_0_end:
    JUMPDEST
    // stack: old counter=0, output_addr, block[0], block[1], retdest
    pop
    push 8
    // stack: counter=8, output_addr, block[0], block[1], retdest
    // Swap the two halves so the second loop works on block[1].
    swap2
    // stack: block[0], output_addr, counter, block[1], retdest
    swap3
    // stack: block[1], output_addr, counter, block[0], retdest
    swap2
    // stack: counter, output_addr, block[1], block[0], retdest
sha2_gen_message_schedule_from_block_1_loop:
    JUMPDEST
    // stack: counter, output_addr, block[1], block[0], retdest
    swap2
    // stack: block[1], output_addr, counter, block[0], retdest
    push 4294967296
    // stack: 1 << 32, block[1], output_addr, counter, block[0], retdest
    dup2
    dup2
    // stack: 1 << 32, block[1], 1 << 32, block[1], output_addr, counter, block[0], retdest
    swap1
    // stack: block[1], 1 << 32, 1 << 32, block[1], output_addr, counter, block[0], retdest
    mod
    // stack: block[1] % (1 << 32), 1 << 32, block[1], output_addr, counter, block[0], retdest
    swap2
    // stack: block[1], 1 << 32, block[1] % (1 << 32), output_addr, counter, block[0], retdest
    div
    // stack: block[1] // (1 << 32), block[1] % (1 << 32), output_addr, counter, block[0], retdest
    swap1
    // stack: block[1] % (1 << 32), block[1] // (1 << 32), output_addr, counter, block[0], retdest
    dup3
    // stack: output_addr, block[1] % (1 << 32), block[1] // (1 << 32), output_addr, counter, block[0], retdest
    %mstore_kernel_general_u32
    // stack: block[1] // (1 << 32), output_addr, counter, block[0], retdest
    swap1
    // stack: output_addr, block[1] // (1 << 32), counter, block[0], retdest
    %add_const(4)
    // stack: output_addr + 4, block[1] // (1 << 32), counter, block[0], retdest
    swap1
    // stack: block[1] // (1 << 32), output_addr + 4, counter, block[0], retdest
    swap2
    // stack: counter, output_addr + 4, block[1] // (1 << 32), block[0], retdest
    %decrement
    dup1
    iszero
    %jumpi(sha2_gen_message_schedule_from_block_1_end)
    %jump(sha2_gen_message_schedule_from_block_1_loop)
sha2_gen_message_schedule_from_block_1_end:
    JUMPDEST
    // stack: old counter=0, output_addr, block[1], block[0], retdest
    pop
    // stack: output_addr, block[1], block[0], retdest
    // Both block slots have been divided by 2^32 eight times and are no longer
    // used; they are only carried along and popped at the end. The comments
    // below keep calling them block[0], block[1].
    push 48
    // stack: counter=48, output_addr, block[0], block[1], retdest
sha2_gen_message_schedule_remaining_loop:
    JUMPDEST
    // stack: counter, output_addr, block[0], block[1], retdest
    swap1
    // stack: output_addr, counter, block[0], block[1], retdest
    dup1
    // stack: output_addr, output_addr, counter, block[0], block[1], retdest
    push 8
    swap1
    sub
    // stack: output_addr - 2*4, output_addr, counter, block[0], block[1], retdest
    %mload_kernel_general_u32
    // stack: x[output_addr - 2*4], output_addr, counter, block[0], block[1], retdest
    %sha2_sigma_1
    // stack: sigma_1(x[output_addr - 2*4]), output_addr, counter, block[0], block[1], retdest
    swap1
    // stack: output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    dup1
    // stack: output_addr, output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    push 28
    swap1
    sub
    // stack: output_addr - 7*4, output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    %mload_kernel_general_u32
    // stack: x[output_addr - 7*4], output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    swap1
    // stack: output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    dup1
    // stack: output_addr, output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    push 60
    swap1
    sub
    // stack: output_addr - 15*4, output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    %mload_kernel_general_u32
    // stack: x[output_addr - 15*4], output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    %sha2_sigma_0
    // stack: sigma_0(x[output_addr - 15*4]), output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    swap1
    // stack: output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    dup1
    // stack: output_addr, output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    push 64
    swap1
    sub
    // stack: output_addr - 16*4, output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    %mload_kernel_general_u32
    // stack: x[output_addr - 16*4], output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    swap1
    // stack: output_addr, x[output_addr - 16*4], sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest
    swap4
    // stack: sigma_1(x[output_addr - 2*4]), x[output_addr - 16*4], sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], output_addr, counter, block[0], block[1], retdest
    add
    add
    add
    // stack: sum, output_addr, counter, block[0], block[1], retdest
    //   where sum = sigma_1(x[output_addr - 2*4]) + x[output_addr - 16*4] + sigma_0(x[output_addr - 15*4]) + x[output_addr - 7*4]
    // The sum of four 32-bit terms can exceed 32 bits; schedule words are
    // defined modulo 2^32, so reduce before storing.
    push 4294967296
    // stack: 1 << 32, sum, output_addr, counter, block[0], block[1], retdest
    swap1
    // stack: sum, 1 << 32, output_addr, counter, block[0], block[1], retdest
    mod
    // stack: sum % (1 << 32), output_addr, counter, block[0], block[1], retdest
    dup2
    // stack: output_addr, sum % (1 << 32), output_addr, counter, block[0], block[1], retdest
    %mstore_kernel_general_u32
    // stack: output_addr, counter, block[0], block[1], retdest
    %add_const(4)
    // stack: output_addr + 4, counter, block[0], block[1], retdest
    swap1
    // stack: counter, output_addr + 4, block[0], block[1], retdest
    %decrement
    // stack: counter - 1, output_addr + 4, block[0], block[1], retdest
    dup1
    iszero
    %jumpi(sha2_gen_message_schedule_remaining_end)
    %jump(sha2_gen_message_schedule_remaining_loop)
sha2_gen_message_schedule_remaining_end:
    JUMPDEST
    // stack: counter=0, output_addr, block[0], block[1], retdest
    %pop4
    // stack: retdest
    // NOTE(review): STOP halts execution here, so the JUMP to retdest below is
    // never reached. This looks like a debugging leftover -- confirm before
    // relying on this routine returning to its caller.
    STOP
    JUMP
2022-07-18 16:12:28 -07:00
2022-08-01 16:29:57 -07:00
//global sha2_gen_all_message_schedules:
// JUMPDEST