// Precodition: stack contains address of one message block, followed by output address // Postcondition: 256 bytes starting at given output address contain the 64 32-bit chunks // of message schedule (in four-byte increments) global sha2_gen_message_schedule_from_block: // stack: block_addr, output_addr, retdest dup1 // stack: block_addr, block_addr, output_addr, retdest %add_const(32) // stack: block_addr + 32, block_addr, output_addr, retdest swap1 // stack: block_addr, block_addr + 32, output_addr, retdest %mload_kernel_general_u256 // stack: block[0], block_addr + 32, output_addr, retdest swap1 // stack: block_addr + 32, block[0], output_addr, retdest %mload_kernel_general_u256 // stack: block[1], block[0], output_addr, retdest swap2 // stack: output_addr, block[0], block[1], retdest %add_const(28) push 8 // stack: counter=8, output_addr + 28, block[0], block[1], retdest %jump(sha2_gen_message_schedule_from_block_0_loop) sha2_gen_message_schedule_from_block_0_loop: // Split the first half (256 bits) of the block into the first eight (32-bit) chunks of the message sdchedule. // stack: counter, output_addr, block[0], block[1], retdest swap2 // stack: block[0], output_addr, counter, block[1], retdest push 1 push 32 shl // stack: 1 << 32, block[0], output_addr, counter, block[1], retdest dup2 dup2 // stack: 1 << 32, block[0], 1 << 32, block[0], output_addr, counter, block[1], retdest swap1 // stack: block[0], 1 << 32, 1 << 32, block[0], output_addr, counter, block[1], retdest mod // stack: block[0] % (1 << 32), 1 << 32, block[0], output_addr, counter, block[1], retdest swap2 // stack: block[0], 1 << 32, block[0] % (1 << 32), output_addr, counter, block[1], retdest div // stack: block[0] >> 32, block[0] % (1 << 32), output_addr, counter, block[1], retdest swap1 // stack: block[0] % (1 << 32), block[0] >> 32, output_addr, counter, block[1], retdest dup3 // stack: output_addr, block[0] % (1 << 32), block[0] >> 32, output_addr, counter, block[1], retdest %mstore_kernel_general_u32 // stack: block[0] >> 32, output_addr, counter, block[1], retdest swap1 // stack: output_addr, block[0] >> 32, counter, block[1], retdest %sub_const(4) // stack: output_addr - 4, block[0] >> 32, counter, block[1], retdest swap1 // stack: block[0] >> 32, output_addr - 4, counter, block[1], retdest swap2 // stack: counter, output_addr - 4, block[0] >> 32, block[1], retdest %decrement dup1 iszero %jumpi(sha2_gen_message_schedule_from_block_0_end) %jump(sha2_gen_message_schedule_from_block_0_loop) sha2_gen_message_schedule_from_block_0_end: // stack: old counter=0, output_addr, block[0], block[1], retdest pop push 8 // stack: counter=8, output_addr, block[0], block[1], retdest swap2 // stack: block[0], output_addr, counter, block[1], retdest swap3 // stack: block[1], output_addr, counter, block[0], retdest swap2 // stack: counter, output_addr, block[1], block[0], retdest swap1 // stack: output_addr, counter, block[1], block[0], retdest %add_const(64) // stack: output_addr + 64, counter, block[1], block[0], retdest swap1 // stack: counter, output_addr + 64, block[1], block[0], retdest sha2_gen_message_schedule_from_block_1_loop: // Split the second half (256 bits) of the block into the next eight (32-bit) chunks of the message sdchedule. // stack: counter, output_addr, block[1], block[0], retdest swap2 // stack: block[1], output_addr, counter, block[0], retdest push 1 push 32 shl // stack: 1 << 32, block[1], output_addr, counter, block[0], retdest dup2 dup2 // stack: 1 << 32, block[1], 1 << 32, block[1], output_addr, counter, block[0], retdest swap1 // stack: block[1], 1 << 32, 1 << 32, block[1], output_addr, counter, block[0], retdest mod // stack: block[1] % (1 << 32), 1 << 32, block[1], output_addr, counter, block[0], retdest swap2 // stack: block[1], 1 << 32, block[1] % (1 << 32), output_addr, counter, block[0], retdest div // stack: block[1] >> 32, block[1] % (1 << 32), output_addr, counter, block[0], retdest swap1 // stack: block[1] % (1 << 32), block[1] >> 32, output_addr, counter, block[0], retdest dup3 // stack: output_addr, block[1] % (1 << 32), block[1] >> 32, output_addr, counter, block[0], retdest %mstore_kernel_general_u32 // stack: block[1] >> 32, output_addr, counter, block[0], retdest swap1 // stack: output_addr, block[1] >> 32, counter, block[0], retdest %sub_const(4) // stack: output_addr - 4, block[1] >> 32, counter, block[0], retdest swap1 // stack: block[1] >> 32, output_addr - 4, counter, block[0], retdest swap2 // stack: counter, output_addr - 4, block[1] >> 32, block[0], retdest %decrement dup1 iszero %jumpi(sha2_gen_message_schedule_from_block_1_end) %jump(sha2_gen_message_schedule_from_block_1_loop) sha2_gen_message_schedule_from_block_1_end: // stack: old counter=0, output_addr, block[1], block[0], retdest pop // stack: output_addr, block[0], block[1], retdest push 48 // stack: counter=48, output_addr, block[0], block[1], retdest swap1 // stack: output_addr, counter, block[0], block[1], retdest %add_const(36) // stack: output_addr + 36, counter, block[0], block[1], retdest swap1 // stack: counter, output_addr + 36, block[0], block[1], retdest sha2_gen_message_schedule_remaining_loop: // Generate the next 48 chunks of the message schedule, one at a time, from prior chunks. // stack: counter, output_addr, block[0], block[1], retdest swap1 // stack: output_addr, counter, block[0], block[1], retdest dup1 // stack: output_addr, output_addr, counter, block[0], block[1], retdest push 2 push 4 mul swap1 sub // stack: output_addr - 2*4, output_addr, counter, block[0], block[1], retdest %mload_kernel_general_u32 // stack: x[output_addr - 2*4], output_addr, counter, block[0], block[1], retdest %sha2_sigma_1 // stack: sigma_1(x[output_addr - 2*4]), output_addr, counter, block[0], block[1], retdest swap1 // stack: output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest dup1 // stack: output_addr, output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest push 7 push 4 mul swap1 sub // stack: output_addr - 7*4, output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest %mload_kernel_general_u32 // stack: x[output_addr - 7*4], output_addr, sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest swap1 // stack: output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest dup1 // stack: output_addr, output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest push 15 push 4 mul swap1 sub // stack: output_addr - 15*4, output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest %mload_kernel_general_u32 // stack: x[output_addr - 15*4], output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest %sha2_sigma_0 // stack: sigma_0(x[output_addr - 15*4]), output_addr, x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest swap1 // stack: output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest dup1 // stack: output_addr, output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest push 16 push 4 mul swap1 sub // stack: output_addr - 16*4, output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest %mload_kernel_general_u32 // stack: x[output_addr - 16*4], output_addr, sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest swap1 // stack: output_addr, x[output_addr - 16*4], sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], sigma_1(x[output_addr - 2*4]), counter, block[0], block[1], retdest swap4 // stack: sigma_1(x[output_addr - 2*4]), x[output_addr - 16*4], sigma_0(x[output_addr - 15*4]), x[output_addr - 7*4], output_addr, counter, block[0], block[1], retdest %add_u32 %add_u32 %add_u32 // stack: sigma_1(x[output_addr - 2*4]) + x[output_addr - 16*4] + sigma_0(x[output_addr - 15*4]) + x[output_addr - 7*4], output_addr, counter, block[0], block[1], retdest swap1 // stack: output_addr, sigma_1(x[output_addr - 2*4]) + x[output_addr - 16*4] + sigma_0(x[output_addr - 15*4]) + x[output_addr - 7*4], counter, block[0], block[1], retdest dup1 // stack: output_addr, output_addr, sigma_1(x[output_addr - 2*4]) + x[output_addr - 16*4] + sigma_0(x[output_addr - 15*4]) + x[output_addr - 7*4], counter, block[0], block[1], retdest swap2 // stack: sigma_1(x[output_addr - 2*4]) + x[output_addr - 16*4] + sigma_0(x[output_addr - 15*4]) + x[output_addr - 7*4], output_addr, output_addr, counter, block[0], block[1], retdest swap1 // stack: output_addr, sigma_1(x[output_addr - 2*4]) + x[output_addr - 16*4] + sigma_0(x[output_addr - 15*4]) + x[output_addr - 7*4], output_addr, counter, block[0], block[1], retdest %mstore_kernel_general_u32 // stack: output_addr, counter, block[0], block[1], retdest %add_const(4) // stack: output_addr + 4, counter, block[0], block[1], retdest swap1 // stack: counter, output_addr + 4, block[0], block[1], retdest %decrement // stack: counter - 1, output_addr + 4, block[0], block[1], retdest dup1 iszero %jumpi(sha2_gen_message_schedule_remaining_end) %jump(sha2_gen_message_schedule_remaining_loop) sha2_gen_message_schedule_remaining_end: // stack: counter=0, output_addr, block[0], block[1], retdest %pop4 JUMP // Precodition: memory, starting at 0, contains num_blocks, block0[0], ..., block0[63], block1[0], ..., blocklast[63] // stack contains output_addr // Postcondition: starting at output_addr, set of 256 bytes per block // each contains the 64 32-bit chunks of the message schedule for that block (in four-byte increments) global sha2_gen_all_message_schedules: // stack: output_addr, retdest dup1 // stack: output_addr, output_addr, retdest push 0 // stack: 0, output_addr, output_addr, retdest %mload_kernel_general // stack: num_blocks, output_addr, output_addr, retdest push 1 // stack: cur_addr = 1, counter = num_blocks, output_addr, output_addr, retdest sha2_gen_all_message_schedules_loop: // stack: cur_addr, counter, cur_output_addr, output_addr, retdest push sha2_gen_all_message_schedules_loop_end // stack: new_retdest = sha2_gen_all_message_schedules_loop_end, cur_addr, counter, cur_output_addr, output_addr, retdest dup4 // stack: cur_output_addr, new_retdest, cur_addr, counter, cur_output_addr, output_addr, retdest dup3 // stack: cur_addr, cur_output_addr, new_retdest, cur_addr, counter, cur_output_addr, output_addr, retdest %jump(sha2_gen_message_schedule_from_block) sha2_gen_all_message_schedules_loop_end: // stack: cur_addr, counter, cur_output_addr, output_addr, retdest %add_const(64) // stack: cur_addr + 64, counter, cur_output_addr, output_addr, retdest swap1 %decrement swap1 // stack: cur_addr + 64, counter - 1, cur_output_addr, output_addr, retdest swap2 %add_const(256) swap2 // stack: cur_addr + 64, counter - 1, cur_output_addr + 256, output_addr, retdest dup2 // stack: counter - 1, cur_addr + 64, counter - 1, cur_output_addr + 256, output_addr, retdest iszero %jumpi(sha2_gen_all_message_schedules_end) %jump(sha2_gen_all_message_schedules_loop) sha2_gen_all_message_schedules_end: // stack: cur_addr + 64, counter - 1, cur_output_addr + 256, output_addr, retdest %pop3 // stack: output_addr, retdest %jump(sha2_compression)