/* SPARC v9 __mpn_addmul_1 -- Multiply a limb vector with a single limb and
   add the product to a second limb vector.

   Copyright (C) 1996-2022 Free Software Foundation, Inc.

   This file is part of the GNU MP Library.

   The GNU MP Library is free software; you can redistribute it and/or modify
   it under the terms of the GNU Lesser General Public License as published by
   the Free Software Foundation; either version 2.1 of the License, or (at your
   option) any later version.

   The GNU MP Library is distributed in the hope that it will be useful, but
   WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
   or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
   License for more details.

   You should have received a copy of the GNU Lesser General Public License
   along with the GNU MP Library; see the file COPYING.LIB.  If not,
   see <https://www.gnu.org/licenses/>.  */

#include <sysdep.h>


/* INPUT PARAMETERS
   res_ptr	o0
   s1_ptr	o1
   size		o2
   s2_limb	o3

   The registers above are the caller's out registers.  After the `save'
   at function entry they are addressed as %i0-%i3.

   For each of the `size' 64-bit limbs the routine computes

	res_ptr[i] += s1_ptr[i] * s2_limb + cy_limb

   stores the low 64 bits back to res_ptr[i] and carries the rest into the
   next limb.  The final cy_limb is returned in the caller's %o0.

   The loop is bottom-tested: its body runs once before the counter is
   checked, so a size of 0 is not handled.

   Only 64-bit `mulx' is used, so each 64x64 product is assembled from four
   32x32->64 partial products.

   Register use inside the loop:
	%o0	cy_limb carried between iterations
	%o1	low 32 bits of s2_limb
	%i3	high 32 bits of s2_limb
	%o2	constant 0x100000000 (a carry out of the mid sum, weighted
		for the hi product)
	%o3	s1_ptr + 8 * size
	%o4	res_ptr + 8 * size
	%o7	negative byte offset, counts up from -8 * size to 0
	%g5, %i0, %i1, %i4, %i5, %l0, %l1, %l2	scratch  */


ENTRY(__mpn_addmul_1)
	save	%sp,-192,%sp		! new register window, args now in %i0-%i3

	sub	%g0,%i2,%o7		! o7 = -size
	mov	0,%o0			! zero cy_limb
	sllx	%o7,3,%o7		! o7 = -size * 8, a negative byte offset
	sethi	%hi(0x80000000),%o2	! o2 = 0x80000000
	srl	%i3,0,%o1		! extract low 32 bits of s2_limb
	sub	%i1,%o7,%o3		! o3 = s1_ptr + size * 8
	srlx	%i3,32,%i3		! extract high 32 bits of s2_limb
	sub	%i0,%o7,%o4		! o4 = res_ptr + size * 8
	add	%o2,%o2,%o2		! o2 = 0x100000000

	/* Alignment of the four partial products within the 128-bit
	   product (most significant bits to the left):  */
	!   hi   !
	     ! mid-1 !
	     ! mid-2 !
		  !  lo   !
1:
	ldx	[%o3+%o7],%g5		! g5 = current s1 limb
	srl	%g5,0,%i0		! zero hi bits
	ldx	[%o4+%o7],%l1		! l1 = current res limb
	srlx	%g5,32,%g5		! g5 = high 32 bits of s1 limb
	mulx	%o1,%i0,%i4		! lo product
	mulx	%i3,%i0,%i1		! mid-1 product
	mulx	%o1,%g5,%l2		! mid-2 product
	mulx	%i3,%g5,%i5		! hi product
	srlx	%i4,32,%i0		! extract high 32 bits of lo product...
	add	%i1,%i0,%i1		! ...and add it to the mid-1 product
	addcc	%i1,%l2,%i1		! add mid products
	mov	0,%l0			! we need the carry from that add...
	movcs	%xcc,%o2,%l0		! ...compute it and...
	sllx	%i1,32,%i0		!  align low bits of mid product
	add	%i5,%l0,%i5		! ...add to bit 32 of the hi product
	srl	%i4,0,%g5		! zero high 32 bits of lo product
	add	%i0,%g5,%i0		! combine into low 64 bits of result
	srlx	%i1,32,%i1		! extract high bits of mid product...
	addcc	%i0,%o0,%i0		! add cy_limb to low 64 bits of result
	add	%i5,%i1,%i1		! ...and add them to the high result
	/* The plain `add' above leaves the condition codes alone, so the
	   `movcs' below still sees the carry from the cy_limb addition.  */
	mov	0,%g5
	movcs	%xcc,1,%g5		! g5 = carry out of the cy_limb add
	addcc	%l1,%i0,%i0		! add the res limb to the low 64 bits
	stx	%i0,[%o4+%o7]		! store the updated res limb
	add	%g5,1,%l1		! l1 = g5 + 1, used if the add above carried
	movcs	%xcc,%l1,%g5		! g5 = total carry out of the low 64 bits
	addcc	%o7,8,%o7		! step to the next limb, Z set after the last
	bne,pt	%xcc,1b
	 add	%i1,%g5,%o0		! compute new cy_limb

	/* Return to the caller.  The `restore' in the delay slot copies
	   cy_limb from this window's %o0 into the caller's %o0.  */
	jmpl	%i7+8, %g0
	 restore %o0,%g0,%o0

END(__mpn_addmul_1)