src/util/bigmath.h

/*
 * Copyright © 2018 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */
01e04c3fSmrg
01e04c3fSmrg#ifndef UTIL_BIGMATH_H
01e04c3fSmrg#define UTIL_BIGMATH_H
01e04c3fSmrg
01e04c3fSmrg#include "macros.h"
01e04c3fSmrg
01e04c3fSmrg#include <assert.h>
01e04c3fSmrg#include <stdint.h>
01e04c3fSmrg#include <string.h>
01e04c3fSmrg
/**
 * Unsigned multi-word addition: dst = a + b.
 *
 * Each operand is an array of 32-bit words with the least-significant word
 * at index 0.  The three arrays may have different lengths; an operand that
 * is shorter than dst is treated as zero-extended.
 *
 * Each input word is read before the matching dst word is written, so dst
 * may be the same array as a or b.
 *
 * \param dst      Receives the low dst_len words of the sum.
 * \param dst_len  Number of words in dst.
 * \param a        First addend.
 * \param a_len    Number of words in a.
 * \param b        Second addend.
 * \param b_len    Number of words in b.
 *
 * \return true if the sum does not fit in dst: either a carry leaves the top
 *         word of dst, or an input has a nonzero word at an index >= dst_len.
 */
static inline bool
_ubm_add_u32arr(uint32_t *dst, unsigned dst_len,
                uint32_t *a, unsigned a_len,
                uint32_t *b, unsigned b_len)
{
   /* Running sum; after each step only the carry (0 or 1) is left in it. */
   uint64_t acc = 0;
   unsigned idx;

   for (idx = 0; idx < dst_len; idx++) {
      const uint64_t a_word = idx < a_len ? a[idx] : 0;
      const uint64_t b_word = idx < b_len ? b[idx] : 0;

      acc += a_word + b_word;
      dst[idx] = (uint32_t)acc;
      acc >>= 32;
   }

   /* Input words that have no counterpart in dst are dropped from the
    * result; any nonzero one means the true sum was truncated.
    */
   for (idx = dst_len; idx < a_len; idx++) {
      if (a[idx] != 0)
         return true;
   }

   for (idx = dst_len; idx < b_len; idx++) {
      if (b[idx] != 0)
         return true;
   }

   /* Otherwise the only way to overflow is a carry out of the top word. */
   return acc != 0;
}

/* Convenience wrapper that passes ARRAY_SIZE() of each argument as its
 * length.  Assumes ARRAY_SIZE is the usual sizeof-based element count, so
 * the arguments must be real arrays rather than pointers.
 */
#define ubm_add_u32arr(dst, a, b) \
   _ubm_add_u32arr(dst, ARRAY_SIZE(dst), a, ARRAY_SIZE(a), b, ARRAY_SIZE(b))
01e04c3fSmrg
/**
 * Unsigned multi-word multiplication: dst = a * b.
 *
 * Each operand is an array of 32-bit words with the least-significant word
 * at index 0.  dst is cleared before any input is read, so it must not
 * alias a or b.
 *
 * \param dst      Receives the low dst_len words of the product.
 * \param dst_len  Number of words in dst.
 * \param a        First factor.
 * \param a_len    Number of words in a.
 * \param b        Second factor.
 * \param b_len    Number of words in b.
 *
 * \return true if the exact product does not fit in dst_len words, i.e. any
 *         partial product or carry that lands at word index >= dst_len is
 *         nonzero.
 */
static inline bool
_ubm_mul_u32arr(uint32_t *dst, unsigned dst_len,
                uint32_t *a, unsigned a_len,
                uint32_t *b, unsigned b_len)
{
   memset(dst, 0, dst_len * sizeof(*dst));

   bool overflow = false;

   for (unsigned i = 0; i < a_len; i++) {
      uint32_t carry = 0;
      for (unsigned j = 0; j < b_len; j++) {
         /* The maximum values of a[i] and b[j] are UINT32_MAX so the maximum
          * value of the product is UINT32_MAX * UINT32_MAX.  The maximum
          * value that will fit in tmp is
          *
          *    UINT64_MAX = (UINT32_MAX << 32) + UINT32_MAX
          *               = UINT32_MAX * (UINT32_MAX + 1) + UINT32_MAX
          *               = UINT32_MAX * UINT32_MAX + 2 * UINT32_MAX
          *
          * so we're guaranteed that we can add in two more 32-bit values
          * (the carry and the current dst word) without overflowing tmp.
          */
         uint64_t tmp = (uint64_t)a[i] * (uint64_t)b[j];
         tmp += carry;
         if (i + j < dst_len) {
            tmp += dst[i + j];
            dst[i + j] = (uint32_t)tmp;
            carry = tmp >> 32;
         } else {
            /* This partial product lands past the end of dst.  It cannot be
             * stored, so it only matters for overflow detection.  We must
             * keep walking the rest of the row rather than stopping here:
             * b[j] may be zero while a later b[j'] is not, and that later
             * term overflows just the same.  The carry has been folded into
             * this check, so clear it to avoid counting it again.
             */
            overflow = overflow || tmp > 0;
            carry = 0;
         }
      }
      /* dst[i + b_len] has not been touched by any earlier row, so a plain
       * store of the final carry is enough.
       */
      if (i + b_len < dst_len)
         dst[i + b_len] = carry;
      else
         overflow = overflow || carry > 0;
   }

   return overflow;
}

/* Convenience wrapper that passes ARRAY_SIZE() of each argument as its
 * length.  Assumes ARRAY_SIZE is the usual sizeof-based element count, so
 * the arguments must be real arrays rather than pointers.
 */
#define ubm_mul_u32arr(dst, a, b) \
   _ubm_mul_u32arr(dst, ARRAY_SIZE(dst), a, ARRAY_SIZE(a), b, ARRAY_SIZE(b))
01e04c3fSmrg
01e04c3fSmrg#endif /* UTIL_BIGMATH_H */