/*	$OpenBSD: bn_arch.h,v 1.14 2024/03/26 06:09:25 jsing Exp $ */
/*
 * Copyright (c) 2023 Joel Sing <jsing@openbsd.org>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
175c83b098Sjsing
18519d53cbSjsing #include <openssl/bn.h>
19519d53cbSjsing
205c83b098Sjsing #ifndef HEADER_BN_ARCH_H
215c83b098Sjsing #define HEADER_BN_ARCH_H
225c83b098Sjsing
235c83b098Sjsing #ifndef OPENSSL_NO_ASM
245c83b098Sjsing
/*
 * Feature macros for this architecture. They are only defined when
 * OPENSSL_NO_ASM is not defined. Each HAVE_BN_<name> presumably tells the
 * generic bignum code that an architecture-specific implementation of the
 * named routine is provided; those implementations are not visible in this
 * header - confirm against the code that tests these macros.
 */
2537c49545Sjsing #define HAVE_BN_ADD
267069ede1Sjsing #define HAVE_BN_ADD_WORDS
277069ede1Sjsing
282c5f73faSjsing #define HAVE_BN_DIV_WORDS
292c5f73faSjsing
308889fb99Sjsing #define HAVE_BN_MUL_ADD_WORDS
31de344ea3Sjsing #define HAVE_BN_MUL_COMBA4
32de344ea3Sjsing #define HAVE_BN_MUL_COMBA8
338889fb99Sjsing #define HAVE_BN_MUL_WORDS
34de344ea3Sjsing
3550b4e57eSjsing #define HAVE_BN_SQR
36de344ea3Sjsing #define HAVE_BN_SQR_COMBA4
37de344ea3Sjsing #define HAVE_BN_SQR_COMBA8
38de344ea3Sjsing
3937c49545Sjsing #define HAVE_BN_SUB
407069ede1Sjsing #define HAVE_BN_SUB_WORDS
417069ede1Sjsing
42e9b52428Sjsing #define HAVE_BN_WORD_CLZ
43e9b52428Sjsing
44519d53cbSjsing #if defined(__GNUC__)
45*739ee6abSjsing
46519d53cbSjsing #define HAVE_BN_DIV_REM_WORDS_INLINE
47519d53cbSjsing
48519d53cbSjsing static inline void
bn_div_rem_words_inline(BN_ULONG h,BN_ULONG l,BN_ULONG d,BN_ULONG * out_q,BN_ULONG * out_r)49519d53cbSjsing bn_div_rem_words_inline(BN_ULONG h, BN_ULONG l, BN_ULONG d, BN_ULONG *out_q,
50519d53cbSjsing BN_ULONG *out_r)
51519d53cbSjsing {
52519d53cbSjsing BN_ULONG q, r;
53519d53cbSjsing
54519d53cbSjsing /*
55519d53cbSjsing * Unsigned division of %rdx:%rax by d with quotient being stored in
56519d53cbSjsing * %rax and remainder in %rdx.
57519d53cbSjsing */
58519d53cbSjsing __asm__ volatile ("divq %4"
59519d53cbSjsing : "=a"(q), "=d"(r)
60519d53cbSjsing : "d"(h), "a"(l), "rm"(d)
61519d53cbSjsing : "cc");
62519d53cbSjsing
63519d53cbSjsing *out_q = q;
64519d53cbSjsing *out_r = r;
65519d53cbSjsing }
66519d53cbSjsing
6782c46216Sjsing #define HAVE_BN_MULW
680db1114fSjsing
690db1114fSjsing static inline void
bn_mulw(BN_ULONG a,BN_ULONG b,BN_ULONG * out_r1,BN_ULONG * out_r0)7082c46216Sjsing bn_mulw(BN_ULONG a, BN_ULONG b, BN_ULONG *out_r1, BN_ULONG *out_r0)
710db1114fSjsing {
7282c46216Sjsing BN_ULONG r1, r0;
730db1114fSjsing
740db1114fSjsing /*
750db1114fSjsing * Unsigned multiplication of %rax, with the double word result being
760db1114fSjsing * stored in %rdx:%rax.
770db1114fSjsing */
780db1114fSjsing __asm__ ("mulq %3"
7982c46216Sjsing : "=d"(r1), "=a"(r0)
800db1114fSjsing : "a"(a), "rm"(b)
810db1114fSjsing : "cc");
820db1114fSjsing
8382c46216Sjsing *out_r1 = r1;
8482c46216Sjsing *out_r0 = r0;
850db1114fSjsing }
86*739ee6abSjsing
87*739ee6abSjsing #define HAVE_BN_SUBW
88*739ee6abSjsing
89*739ee6abSjsing static inline void
bn_subw(BN_ULONG a,BN_ULONG b,BN_ULONG * out_borrow,BN_ULONG * out_r0)90*739ee6abSjsing bn_subw(BN_ULONG a, BN_ULONG b, BN_ULONG *out_borrow, BN_ULONG *out_r0)
91*739ee6abSjsing {
92*739ee6abSjsing BN_ULONG borrow, r0;
93*739ee6abSjsing
94*739ee6abSjsing __asm__ (
95*739ee6abSjsing "subq %3, %1 \n"
96*739ee6abSjsing "setb %b0 \n"
97*739ee6abSjsing "and $1, %0 \n"
98*739ee6abSjsing : "=r"(borrow), "=r"(r0)
99*739ee6abSjsing : "1"(a), "rm"(b)
100*739ee6abSjsing : "cc");
101*739ee6abSjsing
102*739ee6abSjsing *out_borrow = borrow;
103*739ee6abSjsing *out_r0 = r0;
104*739ee6abSjsing }
105*739ee6abSjsing
1060db1114fSjsing #endif /* __GNUC__ */
1070db1114fSjsing
1085c83b098Sjsing #endif
1095c83b098Sjsing #endif
110