xref: /openbsd/lib/libcrypto/bn/arch/amd64/bn_arch.h (revision 739ee6ab)
1*739ee6abSjsing /*	$OpenBSD: bn_arch.h,v 1.14 2024/03/26 06:09:25 jsing Exp $ */
25c83b098Sjsing /*
35c83b098Sjsing  * Copyright (c) 2023 Joel Sing <jsing@openbsd.org>
45c83b098Sjsing  *
55c83b098Sjsing  * Permission to use, copy, modify, and distribute this software for any
65c83b098Sjsing  * purpose with or without fee is hereby granted, provided that the above
75c83b098Sjsing  * copyright notice and this permission notice appear in all copies.
85c83b098Sjsing  *
95c83b098Sjsing  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
105c83b098Sjsing  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
115c83b098Sjsing  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
125c83b098Sjsing  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
135c83b098Sjsing  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
145c83b098Sjsing  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
155c83b098Sjsing  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
165c83b098Sjsing  */
175c83b098Sjsing 
18519d53cbSjsing #include <openssl/bn.h>
19519d53cbSjsing 
205c83b098Sjsing #ifndef HEADER_BN_ARCH_H
215c83b098Sjsing #define HEADER_BN_ARCH_H
225c83b098Sjsing 
235c83b098Sjsing #ifndef OPENSSL_NO_ASM
245c83b098Sjsing 
/*
 * Feature macros for amd64. They are only defined when OPENSSL_NO_ASM is
 * not set.
 *
 * NOTE(review): each HAVE_BN_* macro presumably signals to the generic bn
 * code that an architecture specific version of the named routine is
 * provided elsewhere - confirm against the consumers of these macros.
 */
#define HAVE_BN_ADD
#define HAVE_BN_ADD_WORDS

#define HAVE_BN_DIV_WORDS

#define HAVE_BN_MUL_ADD_WORDS
#define HAVE_BN_MUL_COMBA4
#define HAVE_BN_MUL_COMBA8
#define HAVE_BN_MUL_WORDS

#define HAVE_BN_SQR
#define HAVE_BN_SQR_COMBA4
#define HAVE_BN_SQR_COMBA8

#define HAVE_BN_SUB
#define HAVE_BN_SUB_WORDS

#define HAVE_BN_WORD_CLZ
43e9b52428Sjsing 
44519d53cbSjsing #if defined(__GNUC__)
45*739ee6abSjsing 
46519d53cbSjsing #define HAVE_BN_DIV_REM_WORDS_INLINE
47519d53cbSjsing 
48519d53cbSjsing static inline void
bn_div_rem_words_inline(BN_ULONG h,BN_ULONG l,BN_ULONG d,BN_ULONG * out_q,BN_ULONG * out_r)49519d53cbSjsing bn_div_rem_words_inline(BN_ULONG h, BN_ULONG l, BN_ULONG d, BN_ULONG *out_q,
50519d53cbSjsing     BN_ULONG *out_r)
51519d53cbSjsing {
52519d53cbSjsing 	BN_ULONG q, r;
53519d53cbSjsing 
54519d53cbSjsing 	/*
55519d53cbSjsing 	 * Unsigned division of %rdx:%rax by d with quotient being stored in
56519d53cbSjsing 	 * %rax and remainder in %rdx.
57519d53cbSjsing 	 */
58519d53cbSjsing 	__asm__ volatile ("divq %4"
59519d53cbSjsing 	    : "=a"(q), "=d"(r)
60519d53cbSjsing 	    : "d"(h), "a"(l), "rm"(d)
61519d53cbSjsing 	    : "cc");
62519d53cbSjsing 
63519d53cbSjsing 	*out_q = q;
64519d53cbSjsing 	*out_r = r;
65519d53cbSjsing }
66519d53cbSjsing 
6782c46216Sjsing #define HAVE_BN_MULW
680db1114fSjsing 
690db1114fSjsing static inline void
bn_mulw(BN_ULONG a,BN_ULONG b,BN_ULONG * out_r1,BN_ULONG * out_r0)7082c46216Sjsing bn_mulw(BN_ULONG a, BN_ULONG b, BN_ULONG *out_r1, BN_ULONG *out_r0)
710db1114fSjsing {
7282c46216Sjsing 	BN_ULONG r1, r0;
730db1114fSjsing 
740db1114fSjsing 	/*
750db1114fSjsing 	 * Unsigned multiplication of %rax, with the double word result being
760db1114fSjsing 	 * stored in %rdx:%rax.
770db1114fSjsing 	 */
780db1114fSjsing 	__asm__ ("mulq %3"
7982c46216Sjsing 	    : "=d"(r1), "=a"(r0)
800db1114fSjsing 	    : "a"(a), "rm"(b)
810db1114fSjsing 	    : "cc");
820db1114fSjsing 
8382c46216Sjsing 	*out_r1 = r1;
8482c46216Sjsing 	*out_r0 = r0;
850db1114fSjsing }
86*739ee6abSjsing 
87*739ee6abSjsing #define HAVE_BN_SUBW
88*739ee6abSjsing 
89*739ee6abSjsing static inline void
bn_subw(BN_ULONG a,BN_ULONG b,BN_ULONG * out_borrow,BN_ULONG * out_r0)90*739ee6abSjsing bn_subw(BN_ULONG a, BN_ULONG b, BN_ULONG *out_borrow, BN_ULONG *out_r0)
91*739ee6abSjsing {
92*739ee6abSjsing 	BN_ULONG borrow, r0;
93*739ee6abSjsing 
94*739ee6abSjsing 	__asm__ (
95*739ee6abSjsing 	    "subq   %3, %1 \n"
96*739ee6abSjsing 	    "setb   %b0 \n"
97*739ee6abSjsing 	    "and    $1, %0 \n"
98*739ee6abSjsing 	    : "=r"(borrow), "=r"(r0)
99*739ee6abSjsing 	    : "1"(a), "rm"(b)
100*739ee6abSjsing 	    : "cc");
101*739ee6abSjsing 
102*739ee6abSjsing 	*out_borrow = borrow;
103*739ee6abSjsing 	*out_r0 = r0;
104*739ee6abSjsing }
105*739ee6abSjsing 
1060db1114fSjsing #endif /* __GNUC__ */
1070db1114fSjsing 
1085c83b098Sjsing #endif
1095c83b098Sjsing #endif
110