addmul_1.S source code [glibc/sysdeps/sparc/sparc64/addmul_1.S]

/* SPARC v9 __mpn_addmul_1 -- Multiply a limb vector with a single limb and
   add the product to a second limb vector.

   Copyright (C) 1996-2024 Free Software Foundation, Inc.

   This file is part of the GNU MP Library.

   The GNU MP Library is free software; you can redistribute it and/or modify
   it under the terms of the GNU Lesser General Public License as published by
   the Free Software Foundation; either version 2.1 of the License, or (at your
   option) any later version.

   The GNU MP Library is distributed in the hope that it will be useful, but
   WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
   or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
   License for more details.

   You should have received a copy of the GNU Lesser General Public License
   along with the GNU MP Library; see the file COPYING.LIB. If not,
   see <https://www.gnu.org/licenses/>. */
21
22	#include <sysdep.h>
23
24
/* INPUT PARAMETERS
   res_ptr	o0
   s1_ptr	o1
   size		o2
   s2_limb	o3  */
30
31
/* __mpn_addmul_1 -- multiply the `size' 64-bit limbs starting at s1_ptr by
   s2_limb and add each 128-bit product into the limbs starting at res_ptr,
   carrying from one limb position into the next.

   On entry (caller's window):
	%o0 = res_ptr	%o1 = s1_ptr	%o2 = size (in limbs)	%o3 = s2_limb
   On return:
	%o0 = carry limb left over after the last limb was processed.

   The loop is bottom-tested (the body runs before the count is checked),
   so size must be at least 1.

   Register use after the `save' (the arguments are then %i0-%i3):
	%o0	cy_limb carried between iterations; final return value
	%o1	low 32 bits of s2_limb
	%i3	high 32 bits of s2_limb
	%o2	constant 0x100000000 (a carry into bit 32 of the hi product)
	%o3	s1_ptr + 8*size
	%o4	res_ptr + 8*size
	%o7	byte offset, counts up from -8*size to 0 in steps of 8
	%i0 %i1 %i4 %i5 %l0 %l1 %l2 %g5	per-iteration scratch

   Clobbers %g5 and the integer condition codes.  */

ENTRY(__mpn_addmul_1)
	save	%sp,-192,%sp		! new register window and 192-byte frame

	sub	%g0,%i2,%o7		! o7 = -size
	mov	0,%o0			! zero cy_limb
	sllx	%o7,3,%o7		! o7 = -8*size (byte offset of first limb)
	sethi	%hi(0x80000000),%o2	! o2 = 0x80000000, doubled below
	srl	%i3,0,%o1		! extract low 32 bits of s2_limb
	sub	%i1,%o7,%o3		! o3 = s1_ptr + 8*size
	srlx	%i3,32,%i3		! extract high 32 bits of s2_limb
	sub	%i0,%o7,%o4		! o4 = res_ptr + 8*size
	add	%o2,%o2,%o2		! o2 = 0x100000000

	! The 128-bit product of one s1 limb and s2_limb is assembled from
	! four 32x32->64 partial products that overlap as follows:
	!
	!   127      96 95       64 63       32 31         0
	!   |<-------- hi -------->|
	!               |<------ mid-1 ------->|
	!               |<------ mid-2 ------->|
	!                           |<-------- lo -------->|
	!
	! Plain add/mov/stx do not write the condition codes, so each movcs
	! below still sees the carry of the most recent addcc.
1:
	ldx	[%o3+%o7],%g5		! g5 = current s1 limb
	srl	%g5,0,%i0		! zero hi bits: i0 = low 32 bits of s1 limb
	ldx	[%o4+%o7],%l1		! l1 = current res limb
	srlx	%g5,32,%g5		! g5 = high 32 bits of s1 limb
	mulx	%o1,%i0,%i4		! lo product    (s2 low  * s1 low)
	mulx	%i3,%i0,%i1		! mid-1 product (s2 high * s1 low)
	mulx	%o1,%g5,%l2		! mid-2 product (s2 low  * s1 high)
	mulx	%i3,%g5,%i5		! hi product    (s2 high * s1 high)
	srlx	%i4,32,%i0		! extract high 32 bits of lo product...
	add	%i1,%i0,%i1		! ...and add it to the mid-1 product
					! (cannot overflow 64 bits)
	addcc	%i1,%l2,%i1		! add mid products
	mov	0,%l0			! we need the carry from that add...
	movcs	%xcc,%o2,%l0		! ...compute it and...
	sllx	%i1,32,%i0		! align low bits of mid product
	add	%i5,%l0,%i5		! ...add to bit 32 of the hi product
	srl	%i4,0,%g5		! zero high 32 bits of lo product
	add	%i0,%g5,%i0		! combine into low 64 bits of result
	srlx	%i1,32,%i1		! extract high bits of mid product...
	addcc	%i0,%o0,%i0		! add cy_limb to low 64 bits of result
	add	%i5,%i1,%i1		! ...and add them to the high result
	mov	0,%g5
	movcs	%xcc,1,%g5		! g5 = carry out of the cy_limb addition
	addcc	%l1,%i0,%i0		! add the res limb to the low 64 bits
	stx	%i0,[%o4+%o7]		! store the updated res limb
	add	%g5,1,%l1		! l1 = g5 + 1, used if that add carried
	movcs	%xcc,%l1,%g5		! g5 += carry out of the res limb addition
	addcc	%o7,8,%o7		! step to next limb; zero once all are done
	bne,pt	%xcc,1b
	add	%i1,%g5,%o0		! compute new cy_limb (branch delay slot)

	jmpl	%i7+8, %g0		! return to the caller
	restore	%o0,%g0,%o0		! delay slot: cy_limb -> caller's %o0

END(__mpn_addmul_1)
84

source code of glibc/sysdeps/sparc/sparc64/addmul_1.S