Path: blob/main/contrib/bearssl/src/int/i31_mulacc.c
39482 views
/*1* Copyright (c) 2016 Thomas Pornin <[email protected]>2*3* Permission is hereby granted, free of charge, to any person obtaining4* a copy of this software and associated documentation files (the5* "Software"), to deal in the Software without restriction, including6* without limitation the rights to use, copy, modify, merge, publish,7* distribute, sublicense, and/or sell copies of the Software, and to8* permit persons to whom the Software is furnished to do so, subject to9* the following conditions:10*11* The above copyright notice and this permission notice shall be12* included in all copies or substantial portions of the Software.13*14* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,15* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF16* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND17* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS18* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN19* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN20* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE21* SOFTWARE.22*/2324#include "inner.h"2526/* see inner.h */27void28br_i31_mulacc(uint32_t *d, const uint32_t *a, const uint32_t *b)29{30size_t alen, blen, u;31uint32_t dl, dh;3233alen = (a[0] + 31) >> 5;34blen = (b[0] + 31) >> 5;3536/*37* We want to add the two bit lengths, but these are encoded,38* which requires some extra care.39*/40dl = (a[0] & 31) + (b[0] & 31);41dh = (a[0] >> 5) + (b[0] >> 5);42d[0] = (dh << 5) + dl + (~(uint32_t)(dl - 31) >> 31);4344for (u = 0; u < blen; u ++) {45uint32_t f;46size_t v;4748/*49* Carry always fits on 31 bits; we want to keep it in a50* 32-bit register on 32-bit architectures (on a 64-bit51* architecture, cast down from 64 to 32 bits means52* clearing the high bits, which is not free; on a 32-bit53* architecture, the same operation really means ignoring54* the top register, which has negative or zero cost).55*/56#if BR_6457uint64_t cc;58#else59uint32_t cc;60#endif6162f = b[1 + u];63cc = 0;64for (v = 0; v < alen; v ++) {65uint64_t z;6667z = (uint64_t)d[1 + u + v] + MUL31(f, a[1 + v]) + cc;68cc = z >> 31;69d[1 + u + v] = (uint32_t)z & 0x7FFFFFFF;70}71d[1 + u + alen] = (uint32_t)cc;72}73}747576