/* Copyright 2016-2017 INRIA and Microsoft Corporation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "Hacl_Poly1305_64.h"

/* Field arithmetic for Poly1305 over p = 2^130 - 5, with field elements stored
 * as three limbs of 44, 44 and 42 bits in a uint64_t[3]. */

/* Scale the lowest limb by 20 = 5 * 2^2: after a limb rotation the wrapped
 * limb carries weight 2^132 = 4 * 2^130, and 2^130 is congruent to 5 mod p. */
inline static void Hacl_Bignum_Modulo_reduce(uint64_t *b)
{
  uint64_t b0 = b[0U];
  b[0U] = (b0 << (uint32_t)4U) + (b0 << (uint32_t)2U);
}

/* Fold the bits of limb 2 above 2^42 back into limb 0, multiplied by 5. */
inline static void Hacl_Bignum_Modulo_carry_top(uint64_t *b)
{
  uint64_t b2 = b[2U];
  uint64_t b0 = b[0U];
  uint64_t b2_42 = b2 >> (uint32_t)42U;
  b[2U] = b2 & (uint64_t)0x3ffffffffffU;
  b[0U] = (b2_42 << (uint32_t)2U) + b2_42 + b0;
}

/* Same carry of the top limb, on 128-bit intermediate limbs. */
inline static void Hacl_Bignum_Modulo_carry_top_wide(FStar_UInt128_t *b)
{
  FStar_UInt128_t b2 = b[2U];
  FStar_UInt128_t b0 = b[0U];
  FStar_UInt128_t
  b2_ = FStar_UInt128_logand(b2, FStar_UInt128_uint64_to_uint128((uint64_t)0x3ffffffffffU));
  uint64_t b2_42 = FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(b2, (uint32_t)42U));
  FStar_UInt128_t
  b0_ = FStar_UInt128_add(b0, FStar_UInt128_uint64_to_uint128((b2_42 << (uint32_t)2U) + b2_42));
  b[2U] = b2_;
  b[0U] = b0_;
}

/* Narrow each 128-bit limb back to 64 bits (valid once carries have been
 * propagated). */
inline static void Hacl_Bignum_Fproduct_copy_from_wide_(uint64_t *output, FStar_UInt128_t *input)
{
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)3U; i = i + (uint32_t)1U)
  {
    FStar_UInt128_t xi = input[i];
    output[i] = FStar_UInt128_uint128_to_uint64(xi);
  }
}

/* output[i] += input[i] * s, accumulating in 128-bit limbs. */
inline static void
Hacl_Bignum_Fproduct_sum_scalar_multiplication_(
  FStar_UInt128_t *output,
  uint64_t *input,
  uint64_t s
)
{
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)3U; i = i + (uint32_t)1U)
  {
    FStar_UInt128_t xi = output[i];
    uint64_t yi = input[i];
    output[i] = FStar_UInt128_add_mod(xi, FStar_UInt128_mul_wide(yi, s));
  }
}

/* Propagate carries between the wide limbs, keeping 44 bits per limb. */
inline static void Hacl_Bignum_Fproduct_carry_wide_(FStar_UInt128_t *tmp)
{
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)2U; i = i + (uint32_t)1U)
  {
    uint32_t ctr = i;
    FStar_UInt128_t tctr = tmp[ctr];
    FStar_UInt128_t tctrp1 = tmp[ctr + (uint32_t)1U];
    uint64_t r0 = FStar_UInt128_uint128_to_uint64(tctr) & (uint64_t)0xfffffffffffU;
    FStar_UInt128_t c = FStar_UInt128_shift_right(tctr, (uint32_t)44U);
    tmp[ctr] = FStar_UInt128_uint64_to_uint128(r0);
    tmp[ctr + (uint32_t)1U] = FStar_UInt128_add(tctrp1, c);
  }
}

/* Same carry propagation on 64-bit limbs. */
inline static void Hacl_Bignum_Fproduct_carry_limb_(uint64_t *tmp)
{
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)2U; i = i + (uint32_t)1U)
  {
    uint32_t ctr = i;
    uint64_t tctr = tmp[ctr];
    uint64_t tctrp1 = tmp[ctr + (uint32_t)1U];
    uint64_t r0 = tctr & (uint64_t)0xfffffffffffU;
    uint64_t c = tctr >> (uint32_t)44U;
    tmp[ctr] = r0;
    tmp[ctr + (uint32_t)1U] = tctrp1 + c;
  }
}

/* Multiply the field element by 2^44 modulo p: rotate the limbs upward and
 * scale the wrapped limb by 20. */
inline static void Hacl_Bignum_Fmul_shift_reduce(uint64_t *output)
{
  uint64_t tmp = output[2U];
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)2U; i = i + (uint32_t)1U)
  {
    uint32_t ctr = (uint32_t)3U - i - (uint32_t)1U;
    uint64_t z = output[ctr - (uint32_t)1U];
    output[ctr] = z;
  }
  output[0U] = tmp;
  Hacl_Bignum_Modulo_reduce(output);
}

/* Schoolbook multiplication: for each limb of input2, accumulate
 * input * input2[i] into output, then shift input by one limb (i.e. multiply
 * it by 2^44 mod p). */
static void
Hacl_Bignum_Fmul_mul_shift_reduce_(FStar_UInt128_t *output, uint64_t *input, uint64_t *input2)
{
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)2U; i = i + (uint32_t)1U)
  {
    uint64_t input2i = input2[i];
    Hacl_Bignum_Fproduct_sum_scalar_multiplication_(output, input, input2i);
    Hacl_Bignum_Fmul_shift_reduce(input);
  }
  uint32_t i = (uint32_t)2U;
  uint64_t input2i = input2[i];
  Hacl_Bignum_Fproduct_sum_scalar_multiplication_(output, input, input2i);
}

/* Field multiplication: output = input * input2 mod 2^130 - 5, result kept in
 * partially reduced limb form. */
inline static void Hacl_Bignum_Fmul_fmul(uint64_t *output, uint64_t *input, uint64_t *input2)
{
  uint64_t tmp[3U] = { 0U };
  memcpy(tmp, input, (uint32_t)3U * sizeof input[0U]);
  KRML_CHECK_SIZE(FStar_UInt128_uint64_to_uint128((uint64_t)0U), (uint32_t)3U);
  FStar_UInt128_t t[3U];
  for (uint32_t _i = 0U; _i < (uint32_t)3U; ++_i)
    t[_i] = FStar_UInt128_uint64_to_uint128((uint64_t)0U);
  Hacl_Bignum_Fmul_mul_shift_reduce_(t, tmp, input2);
  Hacl_Bignum_Fproduct_carry_wide_(t);
  Hacl_Bignum_Modulo_carry_top_wide(t);
  Hacl_Bignum_Fproduct_copy_from_wide_(output, t);
  uint64_t i0 = output[0U];
  uint64_t i1 = output[1U];
  uint64_t i0_ = i0 & (uint64_t)0xfffffffffffU;
  uint64_t i1_ = i1 + (i0 >> (uint32_t)44U);
  output[0U] = i0_;
  output[1U] = i1_;
}

/* acc = (acc + block) * r mod p: the core Poly1305 accumulation step. */
inline static void
Hacl_Bignum_AddAndMultiply_add_and_multiply(uint64_t *acc, uint64_t *block, uint64_t *r)
{
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)3U; i = i + (uint32_t)1U)
  {
    uint64_t xi = acc[i];
    uint64_t yi = block[i];
    acc[i] = xi + yi;
  }
  Hacl_Bignum_Fmul_fmul(acc, acc, r);
}

/* Absorb one full 16-byte block: load it as a little-endian 128-bit integer,
 * split it into 44/44/40-bit limbs, set the 2^128 padding bit, accumulate. */
inline static void
Hacl_Impl_Poly1305_64_poly1305_update(Hacl_Impl_Poly1305_64_State_poly1305_state st, uint8_t *m)
{
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut0 = st;
  uint64_t *h = scrut0.h;
  uint64_t *acc = h;
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *r = scrut.r;
  uint64_t *r3 = r;
  uint64_t tmp[3U] = { 0U };
  FStar_UInt128_t m0 = load128_le(m);
  uint64_t r0 = FStar_UInt128_uint128_to_uint64(m0) & (uint64_t)0xfffffffffffU;
  uint64_t
  r1 =
    FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(m0, (uint32_t)44U))
    & (uint64_t)0xfffffffffffU;
  uint64_t r2 = FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(m0, (uint32_t)88U));
  tmp[0U] = r0;
  tmp[1U] = r1;
  tmp[2U] = r2;
  uint64_t b2 = tmp[2U];
  uint64_t b2_ = (uint64_t)0x10000000000U | b2;
  tmp[2U] = b2_;
  Hacl_Bignum_AddAndMultiply_add_and_multiply(acc, tmp, r3);
}

/* Absorb the already-padded last block. Unlike full blocks, the 2^128 bit is
 * not set: the caller has appended the 0x01 padding byte inside `block`. */
inline static void
Hacl_Impl_Poly1305_64_poly1305_process_last_block_(
  uint8_t *block,
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *m,
  uint64_t rem_
)
{
  uint64_t tmp[3U] = { 0U };
  FStar_UInt128_t m0 = load128_le(block);
  uint64_t r0 = FStar_UInt128_uint128_to_uint64(m0) & (uint64_t)0xfffffffffffU;
  uint64_t
  r1 =
    FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(m0, (uint32_t)44U))
    & (uint64_t)0xfffffffffffU;
  uint64_t r2 = FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(m0, (uint32_t)88U));
  tmp[0U] = r0;
  tmp[1U] = r1;
  tmp[2U] = r2;
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut0 = st;
  uint64_t *h = scrut0.h;
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *r = scrut.r;
  Hacl_Bignum_AddAndMultiply_add_and_multiply(h, tmp, r);
}

/* Pad the final partial block: copy the remaining bytes into a zeroed 16-byte
 * buffer, append the 0x01 byte, and absorb it. */
inline static void
Hacl_Impl_Poly1305_64_poly1305_process_last_block(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *m,
  uint64_t rem_
)
{
  uint8_t zero1 = (uint8_t)0U;
  KRML_CHECK_SIZE(zero1, (uint32_t)16U);
  uint8_t block[16U];
  for (uint32_t _i = 0U; _i < (uint32_t)16U; ++_i)
    block[_i] = zero1;
  uint32_t i0 = (uint32_t)rem_;
  uint32_t i = (uint32_t)rem_;
  memcpy(block, m, i * sizeof m[0U]);
  block[i0] = (uint8_t)1U;
  Hacl_Impl_Poly1305_64_poly1305_process_last_block_(block, st, m, rem_);
}

/* Final reduction: propagate carries, fold the top limb back in, and
 * conditionally subtract p = 2^130 - 5 so the accumulator is fully reduced. */
static void Hacl_Impl_Poly1305_64_poly1305_last_pass(uint64_t *acc)
{
  Hacl_Bignum_Fproduct_carry_limb_(acc);
  Hacl_Bignum_Modulo_carry_top(acc);
  uint64_t a0 = acc[0U];
  uint64_t a10 = acc[1U];
  uint64_t a20 = acc[2U];
  uint64_t a0_ = a0 & (uint64_t)0xfffffffffffU;
  uint64_t r0 = a0 >> (uint32_t)44U;
  uint64_t a1_ = (a10 + r0) & (uint64_t)0xfffffffffffU;
  uint64_t r1 = (a10 + r0) >> (uint32_t)44U;
  uint64_t a2_ = a20 + r1;
  acc[0U] = a0_;
  acc[1U] = a1_;
  acc[2U] = a2_;
  Hacl_Bignum_Modulo_carry_top(acc);
  uint64_t i0 = acc[0U];
  uint64_t i1 = acc[1U];
  uint64_t i0_ = i0 & (uint64_t)0xfffffffffffU;
  uint64_t i1_ = i1 + (i0 >> (uint32_t)44U);
  acc[0U] = i0_;
  acc[1U] = i1_;
  /* Constant-time conditional subtraction of p = 2^130 - 5, whose limbs are
   * 0xffffffffffb, 0xfffffffffff and 0x3ffffffffff. */
  uint64_t a00 = acc[0U];
  uint64_t a1 = acc[1U];
  uint64_t a2 = acc[2U];
  uint64_t mask0 = FStar_UInt64_gte_mask(a00, (uint64_t)0xffffffffffbU);
  uint64_t mask1 = FStar_UInt64_eq_mask(a1, (uint64_t)0xfffffffffffU);
  uint64_t mask2 = FStar_UInt64_eq_mask(a2, (uint64_t)0x3ffffffffffU);
  uint64_t mask = (mask0 & mask1) & mask2;
  uint64_t a0_0 = a00 - ((uint64_t)0xffffffffffbU & mask);
  uint64_t a1_0 = a1 - ((uint64_t)0xfffffffffffU & mask);
  uint64_t a2_0 = a2 - ((uint64_t)0x3ffffffffffU & mask);
  acc[0U] = a0_0;
  acc[1U] = a1_0;
  acc[2U] = a2_0;
}

static Hacl_Impl_Poly1305_64_State_poly1305_state
Hacl_Impl_Poly1305_64_mk_state(uint64_t *r, uint64_t *h)
{
  return ((Hacl_Impl_Poly1305_64_State_poly1305_state){ .r = r, .h = h });
}

/* Absorb len1 full 16-byte blocks, one at a time. */
static void
Hacl_Standalone_Poly1305_64_poly1305_blocks(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *m,
  uint64_t len1
)
{
  if (!(len1 == (uint64_t)0U))
  {
    uint8_t *block = m;
    uint8_t *tail1 = m + (uint32_t)16U;
    Hacl_Impl_Poly1305_64_poly1305_update(st, block);
    uint64_t len2 = len1 - (uint64_t)1U;
    Hacl_Standalone_Poly1305_64_poly1305_blocks(st, tail1, len2);
  }
}

/* Clamp r as mandated by the Poly1305 specification, load it into 44-bit
 * limbs, zero the accumulator, then absorb the full blocks. */
static void
Hacl_Standalone_Poly1305_64_poly1305_partial(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *input,
  uint64_t len1,
  uint8_t *kr
)
{
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *r = scrut.r;
  uint64_t *x0 = r;
  FStar_UInt128_t k1 = load128_le(kr);
  FStar_UInt128_t
  k_clamped =
    FStar_UInt128_logand(k1,
      FStar_UInt128_logor(FStar_UInt128_shift_left(FStar_UInt128_uint64_to_uint128((uint64_t)0x0ffffffc0ffffffcU),
          (uint32_t)64U),
        FStar_UInt128_uint64_to_uint128((uint64_t)0x0ffffffc0fffffffU)));
  uint64_t r0 = FStar_UInt128_uint128_to_uint64(k_clamped) & (uint64_t)0xfffffffffffU;
  uint64_t
  r1 =
    FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(k_clamped, (uint32_t)44U))
    & (uint64_t)0xfffffffffffU;
  uint64_t
  r2 = FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(k_clamped, (uint32_t)88U));
  x0[0U] = r0;
  x0[1U] = r1;
  x0[2U] = r2;
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut0 = st;
  uint64_t *h = scrut0.h;
  uint64_t *x00 = h;
  x00[0U] = (uint64_t)0U;
  x00[1U] = (uint64_t)0U;
  x00[2U] = (uint64_t)0U;
  Hacl_Standalone_Poly1305_64_poly1305_blocks(st, input, len1);
}

/* Process the whole message: all full blocks, then the padded last block when
 * the length is not a multiple of 16, then the final reduction. */
static void
Hacl_Standalone_Poly1305_64_poly1305_complete(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *m,
  uint64_t len1,
  uint8_t *k1
)
{
  uint8_t *kr = k1;
  uint64_t len16 = len1 >> (uint32_t)4U;
  uint64_t rem16 = len1 & (uint64_t)0xfU;
  uint8_t *part_input = m;
  uint8_t *last_block = m + (uint32_t)((uint64_t)16U * len16);
  Hacl_Standalone_Poly1305_64_poly1305_partial(st, part_input, len16, kr);
  if (!(rem16 == (uint64_t)0U))
    Hacl_Impl_Poly1305_64_poly1305_process_last_block(st, last_block, rem16);
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *h = scrut.h;
  uint64_t *acc = h;
  Hacl_Impl_Poly1305_64_poly1305_last_pass(acc);
}

/* One-shot MAC: run the full Poly1305 evaluation, then add the second half of
 * the key (s) modulo 2^128 and store the 16-byte tag. */
static void
Hacl_Standalone_Poly1305_64_crypto_onetimeauth_(
  uint8_t *output,
  uint8_t *input,
  uint64_t len1,
  uint8_t *k1
)
{
  uint64_t buf[6U] = { 0U };
  uint64_t *r = buf;
  uint64_t *h = buf + (uint32_t)3U;
  Hacl_Impl_Poly1305_64_State_poly1305_state st = Hacl_Impl_Poly1305_64_mk_state(r, h);
  uint8_t *key_s = k1 + (uint32_t)16U;
  Hacl_Standalone_Poly1305_64_poly1305_complete(st, input, len1, k1);
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *h3 = scrut.h;
  uint64_t *acc = h3;
  FStar_UInt128_t k_ = load128_le(key_s);
  /* Repack the 44/44/42-bit limbs into a 128-bit value and add s. */
  uint64_t h0 = acc[0U];
  uint64_t h1 = acc[1U];
  uint64_t h2 = acc[2U];
  FStar_UInt128_t
  acc_ =
    FStar_UInt128_logor(FStar_UInt128_shift_left(FStar_UInt128_uint64_to_uint128(h2
          << (uint32_t)24U
          | h1 >> (uint32_t)20U),
        (uint32_t)64U),
      FStar_UInt128_uint64_to_uint128(h1 << (uint32_t)44U | h0));
  FStar_UInt128_t mac_ = FStar_UInt128_add_mod(acc_, k_);
  store128_le(output, mac_);
}

static void
Hacl_Standalone_Poly1305_64_crypto_onetimeauth(
  uint8_t *output,
  uint8_t *input,
  uint64_t len1,
  uint8_t *k1
)
{
  Hacl_Standalone_Poly1305_64_crypto_onetimeauth_(output, input, len1, k1);
}

/* Public API. */

Hacl_Impl_Poly1305_64_State_poly1305_state Hacl_Poly1305_64_mk_state(uint64_t *r, uint64_t *acc)
{
  return Hacl_Impl_Poly1305_64_mk_state(r, acc);
}

/* Initialize the state from the first 16 key bytes: clamp r and zero the
 * accumulator. */
void Hacl_Poly1305_64_init(Hacl_Impl_Poly1305_64_State_poly1305_state st, uint8_t *k1)
{
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *r = scrut.r;
  uint64_t *x0 = r;
  FStar_UInt128_t k10 = load128_le(k1);
  FStar_UInt128_t
  k_clamped =
    FStar_UInt128_logand(k10,
      FStar_UInt128_logor(FStar_UInt128_shift_left(FStar_UInt128_uint64_to_uint128((uint64_t)0x0ffffffc0ffffffcU),
          (uint32_t)64U),
        FStar_UInt128_uint64_to_uint128((uint64_t)0x0ffffffc0fffffffU)));
  uint64_t r0 = FStar_UInt128_uint128_to_uint64(k_clamped) & (uint64_t)0xfffffffffffU;
  uint64_t
  r1 =
    FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(k_clamped, (uint32_t)44U))
    & (uint64_t)0xfffffffffffU;
  uint64_t
  r2 = FStar_UInt128_uint128_to_uint64(FStar_UInt128_shift_right(k_clamped, (uint32_t)88U));
  x0[0U] = r0;
  x0[1U] = r1;
  x0[2U] = r2;
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut0 = st;
  uint64_t *h = scrut0.h;
  uint64_t *x00 = h;
  x00[0U] = (uint64_t)0U;
  x00[1U] = (uint64_t)0U;
  x00[2U] = (uint64_t)0U;
}

void Hacl_Poly1305_64_update_block(Hacl_Impl_Poly1305_64_State_poly1305_state st, uint8_t *m)
{
  Hacl_Impl_Poly1305_64_poly1305_update(st, m);
}

/* Absorb num_blocks full 16-byte blocks. */
void
Hacl_Poly1305_64_update(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *m,
  uint32_t num_blocks
)
{
  if (!(num_blocks == (uint32_t)0U))
  {
    uint8_t *block = m;
    uint8_t *m_ = m + (uint32_t)16U;
    uint32_t n1 = num_blocks - (uint32_t)1U;
    Hacl_Poly1305_64_update_block(st, block);
    Hacl_Poly1305_64_update(st, m_, n1);
  }
}

/* Absorb the trailing partial block (len1 < 16) and perform the final
 * reduction of the accumulator. */
void
Hacl_Poly1305_64_update_last(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *m,
  uint32_t len1
)
{
  if (!((uint64_t)len1 == (uint64_t)0U))
    Hacl_Impl_Poly1305_64_poly1305_process_last_block(st, m, (uint64_t)len1);
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *h = scrut.h;
  uint64_t *acc = h;
  Hacl_Impl_Poly1305_64_poly1305_last_pass(acc);
}

/* Produce the tag: add the 16 key bytes pointed to by k1 (the s half of the
 * key) to the accumulator modulo 2^128. */
void
Hacl_Poly1305_64_finish(
  Hacl_Impl_Poly1305_64_State_poly1305_state st,
  uint8_t *mac,
  uint8_t *k1
)
{
  Hacl_Impl_Poly1305_64_State_poly1305_state scrut = st;
  uint64_t *h = scrut.h;
  uint64_t *acc = h;
  FStar_UInt128_t k_ = load128_le(k1);
  uint64_t h0 = acc[0U];
  uint64_t h1 = acc[1U];
  uint64_t h2 = acc[2U];
  FStar_UInt128_t
  acc_ =
    FStar_UInt128_logor(FStar_UInt128_shift_left(FStar_UInt128_uint64_to_uint128(h2
          << (uint32_t)24U
          | h1 >> (uint32_t)20U),
        (uint32_t)64U),
      FStar_UInt128_uint64_to_uint128(h1 << (uint32_t)44U | h0));
  FStar_UInt128_t mac_ = FStar_UInt128_add_mod(acc_, k_);
  store128_le(mac, mac_);
}

/* One-shot Poly1305: output is the 16-byte tag, input is len1 bytes, k1 is the
 * 32-byte one-time key (r || s). */
void
Hacl_Poly1305_64_crypto_onetimeauth(
  uint8_t *output,
  uint8_t *input,
  uint64_t len1,
  uint8_t *k1
)
{
  Hacl_Standalone_Poly1305_64_crypto_onetimeauth(output, input, len1, k1);
}
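
/*
 * Illustrative usage sketch, not part of the original file: it shows how a
 * caller might compute a tag with the one-shot API above and the same tag
 * with the incremental mk_state/init/update/update_last/finish API. The
 * HACL_POLY1305_64_EXAMPLE guard and the demo key/message values are
 * assumptions made for this example only; both paths should print the same
 * 16-byte tag.
 */
#ifdef HACL_POLY1305_64_EXAMPLE
#include <stdio.h>

int main(void)
{
  uint8_t key[32U];             /* one-time key: r (16 bytes) || s (16 bytes) */
  uint8_t msg[34U];             /* arbitrary 34-byte demo message */
  uint8_t tag1[16U] = { 0U };
  uint8_t tag2[16U] = { 0U };
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)32U; i = i + (uint32_t)1U)
    key[i] = (uint8_t)i;
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)34U; i = i + (uint32_t)1U)
    msg[i] = (uint8_t)0x61U;
  /* One-shot: r is clamped internally, s is added to the final accumulator. */
  Hacl_Poly1305_64_crypto_onetimeauth(tag1, msg, (uint64_t)34U, key);
  /* Incremental: two full 16-byte blocks, then a 2-byte trailing block. */
  uint64_t r_limbs[3U] = { 0U };
  uint64_t acc[3U] = { 0U };
  Hacl_Impl_Poly1305_64_State_poly1305_state st = Hacl_Poly1305_64_mk_state(r_limbs, acc);
  Hacl_Poly1305_64_init(st, key);
  Hacl_Poly1305_64_update(st, msg, (uint32_t)2U);
  Hacl_Poly1305_64_update_last(st, msg + (uint32_t)32U, (uint32_t)2U);
  Hacl_Poly1305_64_finish(st, tag2, key + (uint32_t)16U);
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)16U; i = i + (uint32_t)1U)
    printf("%02x", tag1[i]);
  printf("\n");
  for (uint32_t i = (uint32_t)0U; i < (uint32_t)16U; i = i + (uint32_t)1U)
    printf("%02x", tag2[i]);
  printf("\n");
  return 0;
}
#endif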