/* * Copyright (C) 2012 Michael Brown . * Copyright (c) 2023, Xiaotian Wu * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License as * published by the Free Software Foundation; either version 2 of the * License, or any later version. * * This program is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA * 02110-1301, USA. * * You can also choose to distribute this program under the terms of * the Unmodified Binary Distribution Licence (as given in the file * COPYING.UBDL), provided that you have satisfied its requirements. */ FILE_LICENCE ( GPL2_OR_LATER_OR_UBDL ); #include #include #include /** @file * * Big integer support */ /** * Multiply big integers * * @v multiplicand0 Element 0 of big integer to be multiplied * @v multiplier0 Element 0 of big integer to be multiplied * @v result0 Element 0 of big integer to hold result * @v size Number of elements */ void bigint_multiply_raw ( const uint64_t *multiplicand0, const uint64_t *multiplier0, uint64_t *result0, unsigned int size ) { const bigint_t ( size ) __attribute__ (( may_alias )) *multiplicand = ( ( const void * ) multiplicand0 ); const bigint_t ( size ) __attribute__ (( may_alias )) *multiplier = ( ( const void * ) multiplier0 ); bigint_t ( size * 2 ) __attribute__ (( may_alias )) *result = ( ( void * ) result0 ); unsigned int i; unsigned int j; uint64_t multiplicand_element; uint64_t multiplier_element; uint64_t *result_elements; uint64_t discard_low; uint64_t discard_high; uint64_t discard_temp_low; uint64_t discard_temp_high; /* Zero result */ memset ( result, 0, sizeof ( *result ) ); /* Multiply integers one element at a time */ for ( i = 0 ; i < size ; i++ ) { multiplicand_element = multiplicand->element[i]; for ( j = 0 ; j < size ; j++ ) { multiplier_element = multiplier->element[j]; result_elements = &result->element[ i + j ]; /* Perform a single multiply, and add the * resulting double-element into the result, * carrying as necessary. The carry can * never overflow beyond the end of the * result, since: * * a < 2^{n}, b < 2^{n} => ab < 2^{2n} */ __asm__ __volatile__ ( "mul.d %1, %6, %7\n\t" "mulh.du %2, %6, %7\n\t" "ld.d %3, %0, 0\n\t" "ld.d %4, %0, 8\n\t" "add.d %3, %3, %1\n\t" "sltu $t0, %3, %1\n\t" "add.d %4, %4, %2\n\t" "sltu $t1, %4, %2\n\t" "add.d %4, %4, $t0\n\t" "sltu $t0, %4, $t0\n\t" "or $t0, $t0, $t1\n\t" "st.d %3, %0, 0\n\t" "st.d %4, %0, 8\n\t" "addi.d %0, %0, 16\n\t" "beqz $t0, 2f\n" "1:\n\t" "ld.d %3, %0, 0\n\t" "add.d %3, %3, $t0\n\t" "sltu $t0, %3, $t0\n\t" "st.d %3, %0, 0\n\t" "addi.d %0, %0, 8\n\t" "bnez $t0, 1b\n" "2:" : "+r" ( result_elements ), "=&r" ( discard_low ), "=&r" ( discard_high ), "=r" ( discard_temp_low ), "=r" ( discard_temp_high ), "+m" ( *result ) : "r" ( multiplicand_element ), "r" ( multiplier_element ) : "t0", "t1" ); } } }