libgpuverify

Signature verification on GPUs (WiP)
Log | Files | Refs | README | LICENSE

commit 8b93b6635c36c5a5c3902af59bc0e614628b009d
parent f8cbe4d8d06f4be7d5d02a280492f7b34a9167d0
Author: Cedric <cedric.zwahlen@students.bfh.ch>
Date:   Sat, 23 Dec 2023 18:47:57 +0100

Fix Montgomery

Though far from usable still, some progress is being made

Diffstat:
M.DS_Store | 0
Msource/.DS_Store | 0
Msource/Makefile | 2+-
Msource/gmp.c | 1432+++++++++++++++++++++++++++++++++++++++----------------------------------------
Asource/gmp.h | 310+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
Msource/lib-gpu-verify.c | 7++++---
Msource/montgomery-test.c | 2+-
Msource/montgomery.h | 2+-
Msource/montmodmult.c | 616+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
Msource/montmodmult.h | 7+++++++
Msource/rsa-test.c | 2+-
Msource/rsa-test.h | 35-----------------------------------
Msource/util.h | 62++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
Mxcode/.DS_Store | 0
Mxcode/lib-gpu-generate/msgsig.txt | 4++--
Mxcode/lib-gpu-generate/publickey.txt | 4++--
Mxcode/lib-gpu-verify.xcodeproj/project.pbxproj | 38++++++++++++++++++++++++++++++--------
Mxcode/lib-gpu-verify.xcodeproj/project.xcworkspace/xcuserdata/cedriczwahlen.xcuserdatad/UserInterfaceState.xcuserstate | 0
Mxcode/lib-gpu-verify.xcodeproj/xcuserdata/cedriczwahlen.xcuserdatad/xcdebugger/Breakpoints_v2.xcbkptlist | 1501+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
Mxcode/montmodmult.cl | 375+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
Mxcode/verify.cl | 9+++++----
21 files changed, 3626 insertions(+), 782 deletions(-)

diff --git a/.DS_Store b/.DS_Store Binary files differ. diff --git a/source/.DS_Store b/source/.DS_Store Binary files differ. diff --git a/source/Makefile b/source/Makefile @@ -1,3 +1,3 @@ all: - gcc -g -O0 -D CL_TARGET_OPENCL_VERSION=100 -o gpu-verify lib-gpu-verify.c rsa-test.c montgomery-test.c reference-test.c util.c gmp.c -lgcrypt -lOpenCL -lm + gcc -g -O0 -D CL_TARGET_OPENCL_VERSION=100 -o gpu-verify lib-gpu-verify.c rsa-test.c montgomery-test.c reference-test.c util.c gmp.c -lgcrypt -lgmp -lOpenCL -lm diff --git a/source/gmp.c b/source/gmp.c @@ -1,7 +1,3 @@ -#include "gmp.h" - - - /* mini-gmp, a minimalistic implementation of a GNU GMP subset. Contributed to the GNU project by Niels Möller @@ -53,7 +49,7 @@ see https://www.gnu.org/licenses/. */ #include <stdlib.h> #include <string.h> -//#include "mini-gmp.h" +#include "gmp.h" #if !defined(MINI_GMP_DONT_USE_FLOAT_H) #include <float.h> @@ -61,7 +57,24 @@ see https://www.gnu.org/licenses/. */ /* Macros */ +#define GMP_LIMB_BITS (sizeof(mp_limb_t) * CHAR_BIT) + +#define GMP_LIMB_MAX ((mp_limb_t) ~ (mp_limb_t) 0) +#define GMP_LIMB_HIGHBIT ((mp_limb_t) 1 << (GMP_LIMB_BITS - 1)) + +#define GMP_HLIMB_BIT ((mp_limb_t) 1 << (GMP_LIMB_BITS / 2)) +#define GMP_LLIMB_MASK (GMP_HLIMB_BIT - 1) +#define GMP_ULONG_BITS (sizeof(unsigned long) * CHAR_BIT) +#define GMP_ULONG_HIGHBIT ((unsigned long) 1 << (GMP_ULONG_BITS - 1)) + +#define GMP_ABS(x) ((x) >= 0 ? (x) : -(x)) +#define GMP_NEG_CAST(T,x) (-((T)((x) + 1) - 1)) + +#define GMP_MIN(a, b) ((a) < (b) ? (a) : (b)) +#define GMP_MAX(a, b) ((a) > (b) ? (a) : (b)) + +#define GMP_CMP(a,b) (((a) > (b)) - ((a) < (b))) #if defined(DBL_MANT_DIG) && FLT_RADIX == 2 #define GMP_DBL_MANT_BITS DBL_MANT_DIG @@ -72,91 +85,91 @@ see https://www.gnu.org/licenses/. */ /* Return non-zero if xp,xsize and yp,ysize overlap. If xp+xsize<=yp there's no overlap, or if yp+ysize<=xp there's no overlap. If both these are false, there's an overlap. */ -#define GMP_MPN_OVERLAP_P(xp, xsize, yp, ysize) \ +#define GMP_MPN_OVERLAP_P(xp, xsize, yp, ysize) \ ((xp) + (xsize) > (yp) && (yp) + (ysize) > (xp)) #define gmp_assert_nocarry(x) do { \ - mp_limb_t __cy = (x); \ - assert (__cy == 0); \ - (void) (__cy); \ + mp_limb_t __cy = (x); \ + assert (__cy == 0); \ + (void) (__cy); \ } while (0) -#define gmp_clz(count, x) do { \ - mp_limb_t __clz_x = (x); \ - unsigned __clz_c = 0; \ - int LOCAL_SHIFT_BITS = 8; \ - if (GMP_LIMB_BITS > LOCAL_SHIFT_BITS) \ - for (; \ - (__clz_x & ((mp_limb_t) 0xff << (GMP_LIMB_BITS - 8))) == 0; \ - __clz_c += 8) \ - { __clz_x <<= LOCAL_SHIFT_BITS; } \ - for (; (__clz_x & GMP_LIMB_HIGHBIT) == 0; __clz_c++) \ - __clz_x <<= 1; \ - (count) = __clz_c; \ +#define gmp_clz(count, x) do { \ + mp_limb_t __clz_x = (x); \ + unsigned __clz_c = 0; \ + int LOCAL_SHIFT_BITS = 8; \ + if (GMP_LIMB_BITS > LOCAL_SHIFT_BITS) \ + for (; \ + (__clz_x & ((mp_limb_t) 0xff << (GMP_LIMB_BITS - 8))) == 0; \ + __clz_c += 8) \ + { __clz_x <<= LOCAL_SHIFT_BITS; } \ + for (; (__clz_x & GMP_LIMB_HIGHBIT) == 0; __clz_c++) \ + __clz_x <<= 1; \ + (count) = __clz_c; \ } while (0) -#define gmp_ctz(count, x) do { \ - mp_limb_t __ctz_x = (x); \ - unsigned __ctz_c = 0; \ - gmp_clz (__ctz_c, __ctz_x & - __ctz_x); \ - (count) = GMP_LIMB_BITS - 1 - __ctz_c; \ +#define gmp_ctz(count, x) do { \ + mp_limb_t __ctz_x = (x); \ + unsigned __ctz_c = 0; \ + gmp_clz (__ctz_c, __ctz_x & - __ctz_x); \ + (count) = GMP_LIMB_BITS - 1 - __ctz_c; \ } while (0) #define gmp_add_ssaaaa(sh, sl, ah, al, bh, bl) \ - do { \ - mp_limb_t __x; \ - __x = (al) + (bl); \ - (sh) = (ah) + (bh) + (__x < (al)); \ - (sl) = __x; \ + do { \ + mp_limb_t __x; \ + __x = (al) + (bl); \ + (sh) = (ah) + (bh) + (__x < (al)); \ + (sl) = __x; \ } while (0) #define gmp_sub_ddmmss(sh, sl, ah, al, bh, bl) \ - do { \ - mp_limb_t __x; \ - __x = (al) - (bl); \ - (sh) = (ah) - (bh) - ((al) < (bl)); \ - (sl) = __x; \ + do { \ + mp_limb_t __x; \ + __x = (al) - (bl); \ + (sh) = (ah) - (bh) - ((al) < (bl)); \ + (sl) = __x; \ } while (0) -#define gmp_umul_ppmm(w1, w0, u, v) \ - do { \ - int LOCAL_GMP_LIMB_BITS = GMP_LIMB_BITS; \ - if (sizeof(unsigned int) * CHAR_BIT >= 2 * GMP_LIMB_BITS) \ - { \ - unsigned int __ww = (unsigned int) (u) * (v); \ - w0 = (mp_limb_t) __ww; \ - w1 = (mp_limb_t) (__ww >> LOCAL_GMP_LIMB_BITS); \ - } \ - else if (GMP_ULONG_BITS >= 2 * GMP_LIMB_BITS) \ - { \ - unsigned long int __ww = (unsigned long int) (u) * (v); \ - w0 = (mp_limb_t) __ww; \ - w1 = (mp_limb_t) (__ww >> LOCAL_GMP_LIMB_BITS); \ - } \ - else { \ - mp_limb_t __x0, __x1, __x2, __x3; \ - unsigned __ul, __vl, __uh, __vh; \ - mp_limb_t __u = (u), __v = (v); \ - assert (sizeof (unsigned) * 2 >= sizeof (mp_limb_t)); \ - \ - __ul = __u & GMP_LLIMB_MASK; \ - __uh = __u >> (GMP_LIMB_BITS / 2); \ - __vl = __v & GMP_LLIMB_MASK; \ - __vh = __v >> (GMP_LIMB_BITS / 2); \ - \ - __x0 = (mp_limb_t) __ul * __vl; \ - __x1 = (mp_limb_t) __ul * __vh; \ - __x2 = (mp_limb_t) __uh * __vl; \ - __x3 = (mp_limb_t) __uh * __vh; \ - \ - __x1 += __x0 >> (GMP_LIMB_BITS / 2);/* this can't give carry */ \ - __x1 += __x2; /* but this indeed can */ \ - if (__x1 < __x2) /* did we get it? */ \ - __x3 += GMP_HLIMB_BIT; /* yes, add it in the proper pos. */ \ - \ - (w1) = __x3 + (__x1 >> (GMP_LIMB_BITS / 2)); \ - (w0) = (__x1 << (GMP_LIMB_BITS / 2)) + (__x0 & GMP_LLIMB_MASK); \ - } \ +#define gmp_umul_ppmm(w1, w0, u, v) \ + do { \ + int LOCAL_GMP_LIMB_BITS = GMP_LIMB_BITS; \ + if (sizeof(unsigned int) * CHAR_BIT >= 2 * GMP_LIMB_BITS) \ + { \ + unsigned int __ww = (unsigned int) (u) * (v); \ + w0 = (mp_limb_t) __ww; \ + w1 = (mp_limb_t) (__ww >> LOCAL_GMP_LIMB_BITS); \ + } \ + else if (GMP_ULONG_BITS >= 2 * GMP_LIMB_BITS) \ + { \ + unsigned long int __ww = (unsigned long int) (u) * (v); \ + w0 = (mp_limb_t) __ww; \ + w1 = (mp_limb_t) (__ww >> LOCAL_GMP_LIMB_BITS); \ + } \ + else { \ + mp_limb_t __x0, __x1, __x2, __x3; \ + unsigned __ul, __vl, __uh, __vh; \ + mp_limb_t __u = (u), __v = (v); \ + assert (sizeof (unsigned) * 2 >= sizeof (mp_limb_t)); \ + \ + __ul = __u & GMP_LLIMB_MASK; \ + __uh = __u >> (GMP_LIMB_BITS / 2); \ + __vl = __v & GMP_LLIMB_MASK; \ + __vh = __v >> (GMP_LIMB_BITS / 2); \ + \ + __x0 = (mp_limb_t) __ul * __vl; \ + __x1 = (mp_limb_t) __ul * __vh; \ + __x2 = (mp_limb_t) __uh * __vl; \ + __x3 = (mp_limb_t) __uh * __vh; \ + \ + __x1 += __x0 >> (GMP_LIMB_BITS / 2);/* this can't give carry */ \ + __x1 += __x2; /* but this indeed can */ \ + if (__x1 < __x2) /* did we get it? */ \ + __x3 += GMP_HLIMB_BIT; /* yes, add it in the proper pos. */ \ + \ + (w1) = __x3 + (__x1 >> (GMP_LIMB_BITS / 2)); \ + (w0) = (__x1 << (GMP_LIMB_BITS / 2)) + (__x0 & GMP_LLIMB_MASK); \ + } \ } while (0) /* If mp_limb_t is of size smaller than int, plain u*v implies @@ -166,106 +179,106 @@ see https://www.gnu.org/licenses/. */ #define gmp_umullo_limb(u, v) \ ((sizeof(mp_limb_t) >= sizeof(int)) ? (u)*(v) : (unsigned int)(u) * (v)) -#define gmp_udiv_qrnnd_preinv(q, r, nh, nl, d, di) \ - do { \ - mp_limb_t _qh, _ql, _r, _mask; \ - gmp_umul_ppmm (_qh, _ql, (nh), (di)); \ - gmp_add_ssaaaa (_qh, _ql, _qh, _ql, (nh) + 1, (nl)); \ - _r = (nl) - gmp_umullo_limb (_qh, (d)); \ - _mask = -(mp_limb_t) (_r > _ql); /* both > and >= are OK */ \ - _qh += _mask; \ - _r += _mask & (d); \ - if (_r >= (d)) \ - { \ - _r -= (d); \ - _qh++; \ - } \ - \ - (r) = _r; \ - (q) = _qh; \ +#define gmp_udiv_qrnnd_preinv(q, r, nh, nl, d, di) \ + do { \ + mp_limb_t _qh, _ql, _r, _mask; \ + gmp_umul_ppmm (_qh, _ql, (nh), (di)); \ + gmp_add_ssaaaa (_qh, _ql, _qh, _ql, (nh) + 1, (nl)); \ + _r = (nl) - gmp_umullo_limb (_qh, (d)); \ + _mask = -(mp_limb_t) (_r > _ql); /* both > and >= are OK */ \ + _qh += _mask; \ + _r += _mask & (d); \ + if (_r >= (d)) \ + { \ + _r -= (d); \ + _qh++; \ + } \ + \ + (r) = _r; \ + (q) = _qh; \ } while (0) -#define gmp_udiv_qr_3by2(q, r1, r0, n2, n1, n0, d1, d0, dinv) \ - do { \ - mp_limb_t _q0, _t1, _t0, _mask; \ - gmp_umul_ppmm ((q), _q0, (n2), (dinv)); \ - gmp_add_ssaaaa ((q), _q0, (q), _q0, (n2), (n1)); \ - \ - /* Compute the two most significant limbs of n - q'd */ \ - (r1) = (n1) - gmp_umullo_limb ((d1), (q)); \ - gmp_sub_ddmmss ((r1), (r0), (r1), (n0), (d1), (d0)); \ - gmp_umul_ppmm (_t1, _t0, (d0), (q)); \ - gmp_sub_ddmmss ((r1), (r0), (r1), (r0), _t1, _t0); \ - (q)++; \ - \ - /* Conditionally adjust q and the remainders */ \ - _mask = - (mp_limb_t) ((r1) >= _q0); \ - (q) += _mask; \ +#define gmp_udiv_qr_3by2(q, r1, r0, n2, n1, n0, d1, d0, dinv) \ + do { \ + mp_limb_t _q0, _t1, _t0, _mask; \ + gmp_umul_ppmm ((q), _q0, (n2), (dinv)); \ + gmp_add_ssaaaa ((q), _q0, (q), _q0, (n2), (n1)); \ + \ + /* Compute the two most significant limbs of n - q'd */ \ + (r1) = (n1) - gmp_umullo_limb ((d1), (q)); \ + gmp_sub_ddmmss ((r1), (r0), (r1), (n0), (d1), (d0)); \ + gmp_umul_ppmm (_t1, _t0, (d0), (q)); \ + gmp_sub_ddmmss ((r1), (r0), (r1), (r0), _t1, _t0); \ + (q)++; \ + \ + /* Conditionally adjust q and the remainders */ \ + _mask = - (mp_limb_t) ((r1) >= _q0); \ + (q) += _mask; \ gmp_add_ssaaaa ((r1), (r0), (r1), (r0), _mask & (d1), _mask & (d0)); \ - if ((r1) >= (d1)) \ - { \ - if ((r1) > (d1) || (r0) >= (d0)) \ - { \ - (q)++; \ - gmp_sub_ddmmss ((r1), (r0), (r1), (r0), (d1), (d0)); \ - } \ - } \ + if ((r1) >= (d1)) \ + { \ + if ((r1) > (d1) || (r0) >= (d0)) \ + { \ + (q)++; \ + gmp_sub_ddmmss ((r1), (r0), (r1), (r0), (d1), (d0)); \ + } \ + } \ } while (0) /* Swap macros. */ -#define MP_LIMB_T_SWAP(x, y) \ - do { \ - mp_limb_t __mp_limb_t_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mp_limb_t_swap__tmp; \ +#define MP_LIMB_T_SWAP(x, y) \ + do { \ + mp_limb_t __mp_limb_t_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mp_limb_t_swap__tmp; \ } while (0) -#define MP_SIZE_T_SWAP(x, y) \ - do { \ - mp_size_t __mp_size_t_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mp_size_t_swap__tmp; \ +#define MP_SIZE_T_SWAP(x, y) \ + do { \ + mp_size_t __mp_size_t_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mp_size_t_swap__tmp; \ } while (0) -#define MP_BITCNT_T_SWAP(x,y) \ - do { \ - mp_bitcnt_t __mp_bitcnt_t_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mp_bitcnt_t_swap__tmp; \ +#define MP_BITCNT_T_SWAP(x,y) \ + do { \ + mp_bitcnt_t __mp_bitcnt_t_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mp_bitcnt_t_swap__tmp; \ } while (0) -#define MP_PTR_SWAP(x, y) \ - do { \ - mp_ptr __mp_ptr_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mp_ptr_swap__tmp; \ +#define MP_PTR_SWAP(x, y) \ + do { \ + mp_ptr __mp_ptr_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mp_ptr_swap__tmp; \ } while (0) -#define MP_SRCPTR_SWAP(x, y) \ - do { \ - mp_srcptr __mp_srcptr_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mp_srcptr_swap__tmp; \ +#define MP_SRCPTR_SWAP(x, y) \ + do { \ + mp_srcptr __mp_srcptr_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mp_srcptr_swap__tmp; \ } while (0) -#define MPN_PTR_SWAP(xp,xs, yp,ys) \ - do { \ - MP_PTR_SWAP (xp, yp); \ - MP_SIZE_T_SWAP (xs, ys); \ +#define MPN_PTR_SWAP(xp,xs, yp,ys) \ + do { \ + MP_PTR_SWAP (xp, yp); \ + MP_SIZE_T_SWAP (xs, ys); \ } while(0) -#define MPN_SRCPTR_SWAP(xp,xs, yp,ys) \ - do { \ - MP_SRCPTR_SWAP (xp, yp); \ - MP_SIZE_T_SWAP (xs, ys); \ +#define MPN_SRCPTR_SWAP(xp,xs, yp,ys) \ + do { \ + MP_SRCPTR_SWAP (xp, yp); \ + MP_SIZE_T_SWAP (xs, ys); \ } while(0) -#define MPZ_PTR_SWAP(x, y) \ - do { \ - mpz_ptr __mpz_ptr_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mpz_ptr_swap__tmp; \ +#define MPZ_PTR_SWAP(x, y) \ + do { \ + mpz_ptr __mpz_ptr_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mpz_ptr_swap__tmp; \ } while (0) -#define MPZ_SRCPTR_SWAP(x, y) \ - do { \ - mpz_srcptr __mpz_srcptr_swap__tmp = (x); \ - (x) = (y); \ - (y) = __mpz_srcptr_swap__tmp; \ +#define MPZ_SRCPTR_SWAP(x, y) \ + do { \ + mpz_srcptr __mpz_srcptr_swap__tmp = (x); \ + (x) = (y); \ + (y) = __mpz_srcptr_swap__tmp; \ } while (0) const int mp_bits_per_limb = GMP_LIMB_BITS; @@ -309,7 +322,7 @@ gmp_default_realloc (void *old, size_t unused_old_size, size_t new_size) static void gmp_default_free (void *p, size_t unused_size) { - //free (p); + free (p); } static void * (*gmp_allocate_func) (size_t) = gmp_default_alloc; @@ -318,8 +331,8 @@ static void (*gmp_free_func) (void *, size_t) = gmp_default_free; void mp_get_memory_functions (void *(**alloc_func) (size_t), - void *(**realloc_func) (void *, size_t, size_t), - void (**free_func) (void *, size_t)) + void *(**realloc_func) (void *, size_t, size_t), + void (**free_func) (void *, size_t)) { if (alloc_func) *alloc_func = gmp_allocate_func; @@ -333,8 +346,8 @@ mp_get_memory_functions (void *(**alloc_func) (size_t), void mp_set_memory_functions (void *(*alloc_func) (size_t), - void *(*realloc_func) (void *, size_t, size_t), - void (*free_func) (void *, size_t)) + void *(*realloc_func) (void *, size_t, size_t), + void (*free_func) (void *, size_t)) { if (!alloc_func) alloc_func = gmp_default_alloc; @@ -395,7 +408,7 @@ mpn_cmp (mp_srcptr ap, mp_srcptr bp, mp_size_t n) while (--n >= 0) { if (ap[n] != bp[n]) - return ap[n] > bp[n] ? 1 : -1; + return ap[n] > bp[n] ? 1 : -1; } return 0; } @@ -704,7 +717,7 @@ mpn_rshift (mp_ptr rp, mp_srcptr up, mp_size_t n, unsigned int cnt) static mp_bitcnt_t mpn_common_scan (mp_limb_t limb, mp_size_t i, mp_srcptr up, mp_size_t un, - mp_limb_t ux) + mp_limb_t ux) { unsigned cnt; @@ -715,7 +728,7 @@ mpn_common_scan (mp_limb_t limb, mp_size_t i, mp_srcptr up, mp_size_t un, { i++; if (i == un) - return (ux == 0 ? ~(mp_bitcnt_t) 0 : un * GMP_LIMB_BITS); + return (ux == 0 ? ~(mp_bitcnt_t) 0 : un * GMP_LIMB_BITS); limb = ux ^ up[i]; } gmp_ctz (cnt, limb); @@ -729,7 +742,7 @@ mpn_scan1 (mp_srcptr ptr, mp_bitcnt_t bit) i = bit / GMP_LIMB_BITS; return mpn_common_scan ( ptr[i] & (GMP_LIMB_MAX << (bit % GMP_LIMB_BITS)), - i, ptr, i, 0); + i, ptr, i, 0); } mp_bitcnt_t @@ -739,7 +752,7 @@ mpn_scan0 (mp_srcptr ptr, mp_bitcnt_t bit) i = bit / GMP_LIMB_BITS; return mpn_common_scan (~ptr[i] & (GMP_LIMB_MAX << (bit % GMP_LIMB_BITS)), - i, ptr, i, GMP_LIMB_MAX); + i, ptr, i, GMP_LIMB_MAX); } void @@ -756,7 +769,7 @@ mpn_neg (mp_ptr rp, mp_srcptr up, mp_size_t n) { *rp = 0; if (!--n) - return 0; + return 0; ++up; ++rp; } *rp = - *up; @@ -794,7 +807,7 @@ mpn_invert_3by2 (mp_limb_t u1, mp_limb_t u0) /* Adjust to get a half-limb 3/2 inverse, i.e., we want qh' = floor( (b^3 - 1) / u) - b = floor ((b^3 - b u - 1) / u - = floor( (b (~u) + b-1) / u), + = floor( (b (~u) + b-1) / u), and the remainder @@ -812,14 +825,14 @@ mpn_invert_3by2 (mp_limb_t u1, mp_limb_t u0) /* Adjustment steps taken from udiv_qrnnd_c */ if (r < p) { - qh--; - r += u1; - if (r >= u1) /* i.e. we didn't get carry when adding to r */ - if (r < p) - { - qh--; - r += u1; - } + qh--; + r += u1; + if (r >= u1) /* i.e. we didn't get carry when adding to r */ + if (r < p) + { + qh--; + r += u1; + } } r -= p; @@ -840,14 +853,14 @@ mpn_invert_3by2 (mp_limb_t u1, mp_limb_t u0) if (r >= (GMP_LIMB_MAX & (p << (GMP_LIMB_BITS / 2)))) { - ql--; - r += u1; + ql--; + r += u1; } m = ((mp_limb_t) qh << (GMP_LIMB_BITS / 2)) + ql; if (r >= u1) { - m++; - r -= u1; + m++; + r -= u1; } } @@ -859,22 +872,22 @@ mpn_invert_3by2 (mp_limb_t u1, mp_limb_t u0) r = ~r; r += u0; if (r < u0) - { - m--; - if (r >= u1) - { - m--; - r -= u1; - } - r -= u1; - } + { + m--; + if (r >= u1) + { + m--; + r -= u1; + } + r -= u1; + } gmp_umul_ppmm (th, tl, u0, m); r += th; if (r < th) - { - m--; - m -= ((r > u1) | ((r == u1) & (tl > u0))); - } + { + m--; + m -= ((r > u1) | ((r == u1) & (tl > u0))); + } } return m; @@ -904,7 +917,7 @@ mpn_div_qr_1_invert (struct gmp_div_inverse *inv, mp_limb_t d) static void mpn_div_qr_2_invert (struct gmp_div_inverse *inv, - mp_limb_t d1, mp_limb_t d0) + mp_limb_t d1, mp_limb_t d0) { unsigned shift; @@ -923,7 +936,7 @@ mpn_div_qr_2_invert (struct gmp_div_inverse *inv, static void mpn_div_qr_invert (struct gmp_div_inverse *inv, - mp_srcptr dp, mp_size_t dn) + mp_srcptr dp, mp_size_t dn) { assert (dn > 0); @@ -942,10 +955,10 @@ mpn_div_qr_invert (struct gmp_div_inverse *inv, gmp_clz (shift, d1); inv->shift = shift; if (shift > 0) - { - d1 = (d1 << shift) | (d0 >> (GMP_LIMB_BITS - shift)); - d0 = (d0 << shift) | (dp[dn-3] >> (GMP_LIMB_BITS - shift)); - } + { + d1 = (d1 << shift) | (d0 >> (GMP_LIMB_BITS - shift)); + d0 = (d0 << shift) | (dp[dn-3] >> (GMP_LIMB_BITS - shift)); + } inv->d1 = d1; inv->d0 = d0; inv->di = mpn_invert_3by2 (d1, d0); @@ -956,14 +969,12 @@ mpn_div_qr_invert (struct gmp_div_inverse *inv, the sbpi1_div_* functions. */ static mp_limb_t mpn_div_qr_1_preinv (mp_ptr qp, mp_srcptr np, mp_size_t nn, - const struct gmp_div_inverse *inv) + const struct gmp_div_inverse *inv) { mp_limb_t d, di; mp_limb_t r; mp_ptr tp = NULL; mp_size_t tn = 0; - - if (inv->shift > 0) { @@ -971,11 +982,8 @@ mpn_div_qr_1_preinv (mp_ptr qp, mp_srcptr np, mp_size_t nn, tp = qp; if (!tp) { - - printf("%ld\n",nn); - tn = nn; - // tp = tn->_mp_d; - // tp = gmp_alloc_limbs (tn); + tn = nn; + tp = gmp_alloc_limbs (tn); } r = mpn_lshift (tp, np, nn, inv->shift); np = tp; @@ -991,17 +999,17 @@ mpn_div_qr_1_preinv (mp_ptr qp, mp_srcptr np, mp_size_t nn, gmp_udiv_qrnnd_preinv (q, r, r, np[nn], d, di); if (qp) - qp[nn] = q; + qp[nn] = q; } - //if (tn) {} - // gmp_free_limbs (tp, tn); + if (tn) + gmp_free_limbs (tp, tn); return r >> inv->shift; } static void mpn_div_qr_2_preinv (mp_ptr qp, mp_ptr np, mp_size_t nn, - const struct gmp_div_inverse *inv) + const struct gmp_div_inverse *inv) { unsigned shift; mp_size_t i; @@ -1028,7 +1036,7 @@ mpn_div_qr_2_preinv (mp_ptr qp, mp_ptr np, mp_size_t nn, gmp_udiv_qr_3by2 (q, r1, r0, r1, r0, n0, d1, d0, di); if (qp) - qp[i] = q; + qp[i] = q; } while (--i >= 0); @@ -1045,9 +1053,9 @@ mpn_div_qr_2_preinv (mp_ptr qp, mp_ptr np, mp_size_t nn, static void mpn_div_qr_pi1 (mp_ptr qp, - mp_ptr np, mp_size_t nn, mp_limb_t n1, - mp_srcptr dp, mp_size_t dn, - mp_limb_t dinv) + mp_ptr np, mp_size_t nn, mp_limb_t n1, + mp_srcptr dp, mp_size_t dn, + mp_limb_t dinv) { mp_size_t i; @@ -1074,32 +1082,32 @@ mpn_div_qr_pi1 (mp_ptr qp, mp_limb_t n0 = np[dn-1+i]; if (n1 == d1 && n0 == d0) - { - q = GMP_LIMB_MAX; - mpn_submul_1 (np+i, dp, dn, q); - n1 = np[dn-1+i]; /* update n1, last loop's value will now be invalid */ - } + { + q = GMP_LIMB_MAX; + mpn_submul_1 (np+i, dp, dn, q); + n1 = np[dn-1+i]; /* update n1, last loop's value will now be invalid */ + } else - { - gmp_udiv_qr_3by2 (q, n1, n0, n1, n0, np[dn-2+i], d1, d0, dinv); + { + gmp_udiv_qr_3by2 (q, n1, n0, n1, n0, np[dn-2+i], d1, d0, dinv); - cy = mpn_submul_1 (np + i, dp, dn-2, q); + cy = mpn_submul_1 (np + i, dp, dn-2, q); - cy1 = n0 < cy; - n0 = n0 - cy; - cy = n1 < cy1; - n1 = n1 - cy1; - np[dn-2+i] = n0; + cy1 = n0 < cy; + n0 = n0 - cy; + cy = n1 < cy1; + n1 = n1 - cy1; + np[dn-2+i] = n0; - if (cy != 0) - { - n1 += d1 + mpn_add_n (np + i, np + i, dp, dn - 1); - q--; - } - } + if (cy != 0) + { + n1 += d1 + mpn_add_n (np + i, np + i, dp, dn - 1); + q--; + } + } if (qp) - qp[i] = q; + qp[i] = q; } while (--i >= 0); @@ -1108,8 +1116,8 @@ mpn_div_qr_pi1 (mp_ptr qp, static void mpn_div_qr_preinv (mp_ptr qp, mp_ptr np, mp_size_t nn, - mp_srcptr dp, mp_size_t dn, - const struct gmp_div_inverse *inv) + mp_srcptr dp, mp_size_t dn, + const struct gmp_div_inverse *inv) { assert (dn > 0); assert (nn >= dn); @@ -1129,14 +1137,14 @@ mpn_div_qr_preinv (mp_ptr qp, mp_ptr np, mp_size_t nn, shift = inv->shift; if (shift > 0) - nh = mpn_lshift (np, np, nn, shift); + nh = mpn_lshift (np, np, nn, shift); else - nh = 0; + nh = 0; mpn_div_qr_pi1 (qp, np, nn, nh, dp, dn, inv->di); if (shift > 0) - gmp_assert_nocarry (mpn_rshift (np, np, dn, shift)); + gmp_assert_nocarry (mpn_rshift (np, np, dn, shift)); } } @@ -1157,8 +1165,8 @@ mpn_div_qr (mp_ptr qp, mp_ptr np, mp_size_t nn, mp_srcptr dp, mp_size_t dn) dp = tp; } mpn_div_qr_preinv (qp, np, nn, dp, dn, &inv); - if (tp) {} - //gmp_free_limbs (tp, dn); + if (tp) + gmp_free_limbs (tp, dn); } @@ -1222,7 +1230,7 @@ mpn_get_str_bits (unsigned char *sp, unsigned bits, mp_srcptr up, mp_size_t un) unsigned shift; sn = ((un - 1) * GMP_LIMB_BITS + mpn_limb_size_in_base_2 (up[un-1]) - + bits - 1) / bits; + + bits - 1) / bits; mask = (1U << bits) - 1; @@ -1233,10 +1241,10 @@ mpn_get_str_bits (unsigned char *sp, unsigned bits, mp_srcptr up, mp_size_t un) shift += bits; if (shift >= GMP_LIMB_BITS && ++i < un) - { - shift -= GMP_LIMB_BITS; - digit |= up[i] << (bits - shift); - } + { + shift -= GMP_LIMB_BITS; + digit |= up[i] << (bits - shift); + } sp[j] = digit & mask; } return sn; @@ -1246,7 +1254,7 @@ mpn_get_str_bits (unsigned char *sp, unsigned bits, mp_srcptr up, mp_size_t un) the end. */ static size_t mpn_limb_get_str (unsigned char *sp, mp_limb_t w, - const struct gmp_div_inverse *binv) + const struct gmp_div_inverse *binv) { mp_size_t i; for (i = 0; w > 0; i++) @@ -1267,8 +1275,8 @@ mpn_limb_get_str (unsigned char *sp, mp_limb_t w, static size_t mpn_get_str_other (unsigned char *sp, - int base, const struct mpn_base_info *info, - mp_ptr up, mp_size_t un) + int base, const struct mpn_base_info *info, + mp_ptr up, mp_size_t un) { struct gmp_div_inverse binv; size_t sn; @@ -1284,16 +1292,16 @@ mpn_get_str_other (unsigned char *sp, mpn_div_qr_1_invert (&bbinv, info->bb); do - { - mp_limb_t w; - size_t done; - w = mpn_div_qr_1_preinv (up, up, un, &bbinv); - un -= (up[un-1] == 0); - done = mpn_limb_get_str (sp + sn, w, &binv); - - for (sn += done; done < info->exp; done++) - sp[sn++] = 0; - } + { + mp_limb_t w; + size_t done; + w = mpn_div_qr_1_preinv (up, up, un, &bbinv); + un -= (up[un-1] == 0); + done = mpn_limb_get_str (sp + sn, w, &binv); + + for (sn += done; done < info->exp; done++) + sp[sn++] = 0; + } while (un > 1); } sn += mpn_limb_get_str (sp + sn, up[0], &binv); @@ -1331,7 +1339,7 @@ mpn_get_str (unsigned char *sp, int base, mp_ptr up, mp_size_t un) static mp_size_t mpn_set_str_bits (mp_ptr rp, const unsigned char *sp, size_t sn, - unsigned bits) + unsigned bits) { mp_size_t rn; mp_limb_t limb; @@ -1342,13 +1350,13 @@ mpn_set_str_bits (mp_ptr rp, const unsigned char *sp, size_t sn, limb |= (mp_limb_t) sp[sn] << shift; shift += bits; if (shift >= GMP_LIMB_BITS) - { - shift -= GMP_LIMB_BITS; - rp[rn++] = limb; - /* Next line is correct also if shift == 0, - bits == 8, and mp_limb_t == unsigned char. */ - limb = (unsigned int) sp[sn] >> (bits - shift); - } + { + shift -= GMP_LIMB_BITS; + rp[rn++] = limb; + /* Next line is correct also if shift == 0, + bits == 8, and mp_limb_t == unsigned char. */ + limb = (unsigned int) sp[sn] >> (bits - shift); + } } if (limb != 0) rp[rn++] = limb; @@ -1361,7 +1369,7 @@ mpn_set_str_bits (mp_ptr rp, const unsigned char *sp, size_t sn, case a single zero limb is written at *RP, and 1 is returned. */ static mp_size_t mpn_set_str_other (mp_ptr rp, const unsigned char *sp, size_t sn, - mp_limb_t b, const struct mpn_base_info *info) + mp_limb_t b, const struct mpn_base_info *info) { mp_size_t rn; mp_limb_t w; @@ -1385,12 +1393,12 @@ mpn_set_str_other (mp_ptr rp, const unsigned char *sp, size_t sn, w = sp[j++]; for (k = 1; k < info->exp; k++) - w = w * b + sp[j++]; + w = w * b + sp[j++]; cy = mpn_mul_1 (rp, rp, rn, info->bb); cy += mpn_add_1 (rp, rp, rn, w); if (cy > 0) - rp[rn++] = cy; + rp[rn++] = cy; } assert (j == sn); @@ -1422,11 +1430,11 @@ mpn_set_str (mp_ptr rp, const unsigned char *sp, size_t sn, int base) void mpz_init (mpz_t r) { - //static const mp_limb_t dummy_limb = GMP_LIMB_MAX & 0xc1a0; + static const mp_limb_t dummy_limb = GMP_LIMB_MAX & 0xc1a0; r->_mp_alloc = 0; r->_mp_size = 0; -// r->_mp_d = (mp_ptr) &dummy_limb; + r->_mp_d = (mp_ptr) &dummy_limb; } /* The utility of this function is a bit limited, since many functions @@ -1436,19 +1444,19 @@ mpz_init2 (mpz_t r, mp_bitcnt_t bits) { mp_size_t rn; - bits -= (bits != 0); /* Round down, except if 0 */ + bits -= (bits != 0); /* Round down, except if 0 */ rn = 1 + bits / GMP_LIMB_BITS; r->_mp_alloc = rn; r->_mp_size = 0; - // r->_mp_d = gmp_alloc_limbs (rn); + r->_mp_d = gmp_alloc_limbs (rn); } void mpz_clear (mpz_t r) { - // if (r->_mp_alloc) - // gmp_free_limbs (r->_mp_d, r->_mp_alloc); + if (r->_mp_alloc) + gmp_free_limbs (r->_mp_d, r->_mp_alloc); } static mp_ptr @@ -1456,11 +1464,11 @@ mpz_realloc (mpz_t r, mp_size_t size) { size = GMP_MAX (size, 1); - if (r->_mp_alloc) {} - // r->_mp_d = gmp_realloc_limbs (r->_mp_d, r->_mp_alloc, size); - else {} - // r->_mp_d = gmp_alloc_limbs (size); - //r->_mp_alloc = size; + if (r->_mp_alloc) + r->_mp_d = gmp_realloc_limbs (r->_mp_d, r->_mp_alloc, size); + else + r->_mp_d = gmp_alloc_limbs (size); + r->_mp_alloc = size; if (GMP_ABS (r->_mp_size) > size) r->_mp_size = 0; @@ -1469,7 +1477,9 @@ mpz_realloc (mpz_t r, mp_size_t size) } /* Realloc for an mpz_t WHAT if it has less than NEEDED limbs. */ -#define MPZ_REALLOC(z,n) (z)->_mp_d +#define MPZ_REALLOC(z,n) ((n) > (z)->_mp_alloc \ + ? mpz_realloc(z,n) \ + : (z)->_mp_d) /* MPZ assignment and basic conversions. */ void @@ -1480,8 +1490,8 @@ mpz_set_si (mpz_t r, signed long int x) else /* (x < 0) */ if (GMP_LIMB_BITS < GMP_ULONG_BITS) { - mpz_set_ui (r, GMP_NEG_CAST (unsigned long int, x)); - mpz_neg (r, r); + mpz_set_ui (r, GMP_NEG_CAST (unsigned long int, x)); + mpz_neg (r, r); } else { @@ -1498,14 +1508,14 @@ mpz_set_ui (mpz_t r, unsigned long int x) r->_mp_size = 1; MPZ_REALLOC (r, 1)[0] = x; if (GMP_LIMB_BITS < GMP_ULONG_BITS) - { - int LOCAL_GMP_LIMB_BITS = GMP_LIMB_BITS; - while (x >>= LOCAL_GMP_LIMB_BITS) - { - ++ r->_mp_size; - MPZ_REALLOC (r, r->_mp_size)[r->_mp_size - 1] = x; - } - } + { + int LOCAL_GMP_LIMB_BITS = GMP_LIMB_BITS; + while (x >>= LOCAL_GMP_LIMB_BITS) + { + ++ r->_mp_size; + MPZ_REALLOC (r, r->_mp_size)[r->_mp_size - 1] = x; + } + } } else r->_mp_size = 0; @@ -1622,7 +1632,7 @@ mpz_get_ui (const mpz_t u) mp_size_t n = GMP_ABS (u->_mp_size); n = GMP_MIN (n, 1 + (mp_size_t) (GMP_ULONG_BITS - 1) / GMP_LIMB_BITS); while (--n >= 0) - r = (r << LOCAL_GMP_LIMB_BITS) + u->_mp_d[n]; + r = (r << LOCAL_GMP_LIMB_BITS) + u->_mp_d[n]; return r; } @@ -1681,7 +1691,7 @@ static mpz_srcptr mpz_roinit_normal_n (mpz_t x, mp_srcptr xp, mp_size_t xs) { x->_mp_alloc = 0; - //x->_mp_d = (mp_ptr) xp; + x->_mp_d = (mp_ptr) xp; x->_mp_size = xs; return x; } @@ -1778,11 +1788,11 @@ mpz_get_d (const mpz_t u) { x = B*x; if (m > 0) { - l = u->_mp_d[un]; - m -= GMP_LIMB_BITS; - if (m < 0) - l &= GMP_LIMB_MAX << -m; - x += l; + l = u->_mp_d[un]; + m -= GMP_LIMB_BITS; + if (m < 0) + l &= GMP_LIMB_MAX << -m; + x += l; } } @@ -1811,24 +1821,24 @@ mpz_cmpabs_d (const mpz_t x, double d) /* Scale d so it can be compared with the top limb. */ for (i = 1; i < xn; i++) - d *= Bi; + d *= Bi; if (d >= B) - return -1; + return -1; /* Compare floor(d) to top limb, subtract and cancel when equal. */ for (i = xn; i-- > 0;) - { - mp_limb_t f, xl; - - f = (mp_limb_t) d; - xl = x->_mp_d[i]; - if (xl > f) - return 1; - else if (xl < f) - return -1; - d = B * (d - f); - } + { + mp_limb_t f, xl; + + f = (mp_limb_t) d; + xl = x->_mp_d[i]; + if (xl > f) + return 1; + else if (xl < f) + return -1; + d = B * (d - f); + } } return - (d > 0.0); } @@ -1839,16 +1849,16 @@ mpz_cmp_d (const mpz_t x, double d) if (x->_mp_size < 0) { if (d >= 0.0) - return -1; + return -1; else - return -mpz_cmpabs_d (x, d); + return -mpz_cmpabs_d (x, d); } else { if (d < 0.0) - return 1; + return 1; else - return mpz_cmpabs_d (x, d); + return mpz_cmpabs_d (x, d); } } @@ -1916,7 +1926,7 @@ int mpz_cmpabs (const mpz_t u, const mpz_t v) { return mpn_cmp4 (u->_mp_d, GMP_ABS (u->_mp_size), - v->_mp_d, GMP_ABS (v->_mp_size)); + v->_mp_d, GMP_ABS (v->_mp_size)); } void @@ -1936,16 +1946,8 @@ mpz_neg (mpz_t r, const mpz_t u) void mpz_swap (mpz_t u, mpz_t v) { - //MP_SIZE_T_SWAP (u->_mp_alloc, v->_mp_alloc); - //MPN_PTR_SWAP (u->_mp_d, u->_mp_size, v->_mp_d, v->_mp_size); - - mpz_t temp; - mpz_init(temp); - - *temp = *u; - *u = *v; - *v = *temp; - + MP_SIZE_T_SWAP (u->_mp_alloc, v->_mp_alloc); + MPN_PTR_SWAP (u->_mp_d, u->_mp_size, v->_mp_d, v->_mp_size); } @@ -2191,7 +2193,7 @@ enum mpz_div_round_mode { GMP_DIV_FLOOR, GMP_DIV_CEIL, GMP_DIV_TRUNC }; /* Allows q or r to be zero. Returns 1 iff remainder is non-zero. */ static int mpz_div_qr (mpz_t q, mpz_t r, - const mpz_t n, const mpz_t d, enum mpz_div_round_mode mode) + const mpz_t n, const mpz_t d, enum mpz_div_round_mode mode) { mp_size_t ns, ds, nn, dn, qs; ns = n->_mp_size; @@ -2203,9 +2205,9 @@ mpz_div_qr (mpz_t q, mpz_t r, if (ns == 0) { if (q) - q->_mp_size = 0; + q->_mp_size = 0; if (r) - r->_mp_size = 0; + r->_mp_size = 0; return 0; } @@ -2217,29 +2219,29 @@ mpz_div_qr (mpz_t q, mpz_t r, if (nn < dn) { if (mode == GMP_DIV_CEIL && qs >= 0) - { - /* q = 1, r = n - d */ - if (r) - mpz_sub (r, n, d); - if (q) - mpz_set_ui (q, 1); - } + { + /* q = 1, r = n - d */ + if (r) + mpz_sub (r, n, d); + if (q) + mpz_set_ui (q, 1); + } else if (mode == GMP_DIV_FLOOR && qs < 0) - { - /* q = -1, r = n + d */ - if (r) - mpz_add (r, n, d); - if (q) - mpz_set_si (q, -1); - } + { + /* q = -1, r = n + d */ + if (r) + mpz_add (r, n, d); + if (q) + mpz_set_si (q, -1); + } else - { - /* q = 0, r = d */ - if (r) - mpz_set (r, n); - if (q) - q->_mp_size = 0; - } + { + /* q = 0, r = d */ + if (r) + mpz_set (r, n); + if (q) + q->_mp_size = 0; + } return 1; } else @@ -2254,46 +2256,46 @@ mpz_div_qr (mpz_t q, mpz_t r, qn = nn - dn + 1; if (q) - { - mpz_init2 (tq, qn * GMP_LIMB_BITS); - qp = tq->_mp_d; - } + { + mpz_init2 (tq, qn * GMP_LIMB_BITS); + qp = tq->_mp_d; + } else - qp = NULL; + qp = NULL; mpn_div_qr (qp, np, nn, d->_mp_d, dn); if (qp) - { - qn -= (qp[qn-1] == 0); + { + qn -= (qp[qn-1] == 0); - tq->_mp_size = qs < 0 ? -qn : qn; - } + tq->_mp_size = qs < 0 ? -qn : qn; + } rn = mpn_normalized_size (np, dn); tr->_mp_size = ns < 0 ? - rn : rn; if (mode == GMP_DIV_FLOOR && qs < 0 && rn != 0) - { - if (q) - mpz_sub_ui (tq, tq, 1); - if (r) - mpz_add (tr, tr, d); - } + { + if (q) + mpz_sub_ui (tq, tq, 1); + if (r) + mpz_add (tr, tr, d); + } else if (mode == GMP_DIV_CEIL && qs >= 0 && rn != 0) - { - if (q) - mpz_add_ui (tq, tq, 1); - if (r) - mpz_sub (tr, tr, d); - } + { + if (q) + mpz_add_ui (tq, tq, 1); + if (r) + mpz_sub (tr, tr, d); + } if (q) - { - mpz_swap (tq, q); - mpz_clear (tq); - } + { + mpz_swap (tq, q); + mpz_clear (tq); + } if (r) - mpz_swap (tr, r); + mpz_swap (tr, r); mpz_clear (tr); @@ -2363,7 +2365,7 @@ mpz_mod (mpz_t r, const mpz_t n, const mpz_t d) static void mpz_div_q_2exp (mpz_t q, const mpz_t u, mp_bitcnt_t bit_index, - enum mpz_div_round_mode mode) + enum mpz_div_round_mode mode) { mp_size_t un, qn; mp_size_t limb_cnt; @@ -2384,9 +2386,9 @@ mpz_div_q_2exp (mpz_t q, const mpz_t u, mp_bitcnt_t bit_index, /* Note: Below, the final indexing at limb_cnt is valid because at that point we have qn > 0. */ adjust = (qn <= 0 - || !mpn_zero_p (u->_mp_d, limb_cnt) - || (u->_mp_d[limb_cnt] - & (((mp_limb_t) 1 << bit_index) - 1))); + || !mpn_zero_p (u->_mp_d, limb_cnt) + || (u->_mp_d[limb_cnt] + & (((mp_limb_t) 1 << bit_index) - 1))); else adjust = 0; @@ -2397,14 +2399,14 @@ mpz_div_q_2exp (mpz_t q, const mpz_t u, mp_bitcnt_t bit_index, qp = MPZ_REALLOC (q, qn); if (bit_index != 0) - { - mpn_rshift (qp, u->_mp_d + limb_cnt, qn, bit_index); - qn -= qp[qn - 1] == 0; - } + { + mpn_rshift (qp, u->_mp_d + limb_cnt, qn, bit_index); + qn -= qp[qn - 1] == 0; + } else - { - mpn_copyi (qp, u->_mp_d + limb_cnt, qn); - } + { + mpn_copyi (qp, u->_mp_d + limb_cnt, qn); + } } q->_mp_size = qn; @@ -2417,7 +2419,7 @@ mpz_div_q_2exp (mpz_t q, const mpz_t u, mp_bitcnt_t bit_index, static void mpz_div_r_2exp (mpz_t r, const mpz_t u, mp_bitcnt_t bit_index, - enum mpz_div_round_mode mode) + enum mpz_div_round_mode mode) { mp_size_t us, un, rn; mp_ptr rp; @@ -2440,46 +2442,46 @@ mpz_div_r_2exp (mpz_t r, const mpz_t u, mp_bitcnt_t bit_index, if (rn > un) { /* Quotient (with truncation) is zero, and remainder is - non-zero */ + non-zero */ if (mode == ((us > 0) ? GMP_DIV_CEIL : GMP_DIV_FLOOR)) /* us != 0 here. */ - { - /* Have to negate and sign extend. */ - mp_size_t i; + { + /* Have to negate and sign extend. */ + mp_size_t i; - gmp_assert_nocarry (! mpn_neg (rp, u->_mp_d, un)); - for (i = un; i < rn - 1; i++) - rp[i] = GMP_LIMB_MAX; + gmp_assert_nocarry (! mpn_neg (rp, u->_mp_d, un)); + for (i = un; i < rn - 1; i++) + rp[i] = GMP_LIMB_MAX; - rp[rn-1] = mask; - us = -us; - } + rp[rn-1] = mask; + us = -us; + } else - { - /* Just copy */ - if (r != u) - mpn_copyi (rp, u->_mp_d, un); + { + /* Just copy */ + if (r != u) + mpn_copyi (rp, u->_mp_d, un); - rn = un; - } + rn = un; + } } else { if (r != u) - mpn_copyi (rp, u->_mp_d, rn - 1); + mpn_copyi (rp, u->_mp_d, rn - 1); rp[rn-1] = u->_mp_d[rn-1] & mask; if (mode == ((us > 0) ? GMP_DIV_CEIL : GMP_DIV_FLOOR)) /* us != 0 here. */ - { - /* If r != 0, compute 2^{bit_count} - r. */ - mpn_neg (rp, rp, rn); + { + /* If r != 0, compute 2^{bit_count} - r. */ + mpn_neg (rp, rp, rn); - rp[rn-1] &= mask; + rp[rn-1] &= mask; - /* us is not used for anything else, so we can modify it - here to indicate flipped sign. */ - us = -us; - } + /* us is not used for anything else, so we can modify it + here to indicate flipped sign. */ + us = -us; + } } rn = mpn_normalized_size (rp, rn); r->_mp_size = us < 0 ? -rn : rn; @@ -2553,7 +2555,7 @@ mpz_congruent_p (const mpz_t a, const mpz_t b, const mpz_t m) static unsigned long mpz_div_qr_ui (mpz_t q, mpz_t r, - const mpz_t n, unsigned long d, enum mpz_div_round_mode mode) + const mpz_t n, unsigned long d, enum mpz_div_round_mode mode) { unsigned long ret; mpz_t rr, dd; @@ -2687,19 +2689,19 @@ mpn_gcd_11 (mp_limb_t u, mp_limb_t v) while (u != v) { if (u > v) - { - u -= v; - do - u >>= 1; - while ( (u & 1) == 0); - } + { + u -= v; + do + u >>= 1; + while ( (u & 1) == 0); + } else - { - v -= u; - do - v >>= 1; - while ( (v & 1) == 0); - } + { + v -= u; + do + v >>= 1; + while ( (v & 1) == 0); + } } return u << shift; } @@ -2771,30 +2773,30 @@ mpz_gcd (mpz_t g, const mpz_t u, const mpz_t v) else for (;;) { - int c; - - mpz_make_odd (tu); - c = mpz_cmp (tu, tv); - if (c == 0) - { - mpz_swap (g, tu); - break; - } - if (c < 0) - mpz_swap (tu, tv); - - if (tv->_mp_size == 1) - { - mp_limb_t *gp; - - mpz_tdiv_r (tu, tu, tv); - gp = MPZ_REALLOC (g, 1); /* gp = mpz_limbs_modify (g, 1); */ - *gp = mpn_gcd_11 (tu->_mp_d[0], tv->_mp_d[0]); - - g->_mp_size = *gp != 0; /* mpz_limbs_finish (g, 1); */ - break; - } - mpz_sub (tu, tu, tv); + int c; + + mpz_make_odd (tu); + c = mpz_cmp (tu, tv); + if (c == 0) + { + mpz_swap (g, tu); + break; + } + if (c < 0) + mpz_swap (tu, tv); + + if (tv->_mp_size == 1) + { + mp_limb_t *gp; + + mpz_tdiv_r (tu, tu, tv); + gp = MPZ_REALLOC (g, 1); /* gp = mpz_limbs_modify (g, 1); */ + *gp = mpn_gcd_11 (tu->_mp_d[0], tv->_mp_d[0]); + + g->_mp_size = *gp != 0; /* mpz_limbs_finish (g, 1); */ + break; + } + mpz_sub (tu, tu, tv); } mpz_clear (tu); mpz_clear (tv); @@ -2814,9 +2816,9 @@ mpz_gcdext (mpz_t g, mpz_t s, mpz_t t, const mpz_t u, const mpz_t v) signed long sign = mpz_sgn (v); mpz_abs (g, v); if (s) - s->_mp_size = 0; + s->_mp_size = 0; if (t) - mpz_set_si (t, sign); + mpz_set_si (t, sign); return; } @@ -2826,9 +2828,9 @@ mpz_gcdext (mpz_t g, mpz_t s, mpz_t t, const mpz_t u, const mpz_t v) signed long sign = mpz_sgn (u); mpz_abs (g, u); if (s) - mpz_set_si (s, sign); + mpz_set_si (s, sign); if (t) - t->_mp_size = 0; + t->_mp_size = 0; return; } @@ -2894,39 +2896,39 @@ mpz_gcdext (mpz_t g, mpz_t s, mpz_t t, const mpz_t u, const mpz_t v) power += shift; for (;;) - { - int c; - c = mpz_cmp (tu, tv); - if (c == 0) - break; - - if (c < 0) - { - /* tv = tv' + tu - * - * u = t0 tu + t1 (tv' + tu) = (t0 + t1) tu + t1 tv' - * v = s0 tu + s1 (tv' + tu) = (s0 + s1) tu + s1 tv' */ - - mpz_sub (tv, tv, tu); - mpz_add (t0, t0, t1); - mpz_add (s0, s0, s1); - - shift = mpz_make_odd (tv); - mpz_mul_2exp (t1, t1, shift); - mpz_mul_2exp (s1, s1, shift); - } - else - { - mpz_sub (tu, tu, tv); - mpz_add (t1, t0, t1); - mpz_add (s1, s0, s1); - - shift = mpz_make_odd (tu); - mpz_mul_2exp (t0, t0, shift); - mpz_mul_2exp (s0, s0, shift); - } - power += shift; - } + { + int c; + c = mpz_cmp (tu, tv); + if (c == 0) + break; + + if (c < 0) + { + /* tv = tv' + tu + * + * u = t0 tu + t1 (tv' + tu) = (t0 + t1) tu + t1 tv' + * v = s0 tu + s1 (tv' + tu) = (s0 + s1) tu + s1 tv' */ + + mpz_sub (tv, tv, tu); + mpz_add (t0, t0, t1); + mpz_add (s0, s0, s1); + + shift = mpz_make_odd (tv); + mpz_mul_2exp (t1, t1, shift); + mpz_mul_2exp (s1, s1, shift); + } + else + { + mpz_sub (tu, tu, tv); + mpz_add (t1, t0, t1); + mpz_add (s1, s0, s1); + + shift = mpz_make_odd (tu); + mpz_mul_2exp (t0, t0, shift); + mpz_mul_2exp (s0, s0, shift); + } + power += shift; + } } else mpz_setbit (t0, uz); @@ -2949,10 +2951,10 @@ mpz_gcdext (mpz_t g, mpz_t s, mpz_t t, const mpz_t u, const mpz_t v) { /* s0 u + t0 v = (s0 - v/g) u - (t0 + u/g) v */ if (mpz_odd_p (s0) || mpz_odd_p (t0)) - { - mpz_sub (s0, s0, s1); - mpz_add (t0, t0, t1); - } + { + mpz_sub (s0, s0, s1); + mpz_add (t0, t0, t1); + } assert (mpz_even_p (t0) && mpz_even_p (s0)); mpz_tdiv_q_2exp (s0, s0, 1); mpz_tdiv_q_2exp (t0, t0, 1); @@ -3038,12 +3040,12 @@ mpz_invert (mpz_t r, const mpz_t u, const mpz_t m) if (invertible) { if (tr->_mp_size < 0) - { - if (m->_mp_size >= 0) - mpz_add (tr, tr, m); - else - mpz_sub (tr, tr, m); - } + { + if (m->_mp_size >= 0) + mpz_add (tr, tr, m); + else + mpz_sub (tr, tr, m); + } mpz_swap (r, tr); } @@ -3067,7 +3069,7 @@ mpz_pow_ui (mpz_t r, const mpz_t b, unsigned long e) { mpz_mul (tr, tr, tr); if (e & bit) - mpz_mul (tr, tr, b); + mpz_mul (tr, tr, b); bit >>= 1; } while (bit > 0); @@ -3095,8 +3097,7 @@ mpz_powm (mpz_t r, const mpz_t b, const mpz_t e, const mpz_t m) mp_srcptr mp; struct gmp_div_inverse minv; unsigned shift; - //mp_ptr tp = NULL; - mpz_t tp; + mp_ptr tp = NULL; en = GMP_ABS (e->_mp_size); mn = GMP_ABS (m->_mp_size); @@ -3116,13 +3117,12 @@ mpz_powm (mpz_t r, const mpz_t b, const mpz_t e, const mpz_t m) if (shift > 0) { /* To avoid shifts, we do all our reductions, except the final - one, using a *normalized* m. */ + one, using a *normalized* m. */ minv.shift = 0; - //tp = gmp_alloc_limbs (mn); - - gmp_assert_nocarry (mpn_lshift (tp->_mp_d, mp, mn, shift)); - mp = tp->_mp_d; + tp = gmp_alloc_limbs (mn); + gmp_assert_nocarry (mpn_lshift (tp, mp, mn, shift)); + mp = tp; } mpz_init (base); @@ -3130,7 +3130,7 @@ mpz_powm (mpz_t r, const mpz_t b, const mpz_t e, const mpz_t m) if (e->_mp_size < 0) { if (!mpz_invert (base, b, m)) - gmp_die ("mpz_powm: Negative exponent and non-invertible base."); + gmp_die ("mpz_powm: Negative exponent and non-invertible base."); } else { @@ -3139,20 +3139,20 @@ mpz_powm (mpz_t r, const mpz_t b, const mpz_t e, const mpz_t m) bn = base->_mp_size; if (bn >= mn) - { - mpn_div_qr_preinv (NULL, base->_mp_d, base->_mp_size, mp, mn, &minv); - bn = mn; - } + { + mpn_div_qr_preinv (NULL, base->_mp_d, base->_mp_size, mp, mn, &minv); + bn = mn; + } /* We have reduced the absolute value. Now take care of the - sign. Note that we get zero represented non-canonically as - m. */ + sign. Note that we get zero represented non-canonically as + m. */ if (b->_mp_size < 0) - { - mp_ptr bp = MPZ_REALLOC (base, mn); - gmp_assert_nocarry (mpn_sub (bp, mp, mn, bp, bn)); - bn = mn; - } + { + mp_ptr bp = MPZ_REALLOC (base, mn); + gmp_assert_nocarry (mpn_sub (bp, mp, mn, bp, bn)); + bn = mn; + } base->_mp_size = mpn_normalized_size (base->_mp_d, bn); } mpz_init_set_ui (tr, 1); @@ -3164,17 +3164,17 @@ mpz_powm (mpz_t r, const mpz_t b, const mpz_t e, const mpz_t m) bit = GMP_LIMB_HIGHBIT; do - { - mpz_mul (tr, tr, tr); - if (w & bit) - mpz_mul (tr, tr, base); - if (tr->_mp_size > mn) - { - mpn_div_qr_preinv (NULL, tr->_mp_d, tr->_mp_size, mp, mn, &minv); - tr->_mp_size = mpn_normalized_size (tr->_mp_d, mn); - } - bit >>= 1; - } + { + mpz_mul (tr, tr, tr); + if (w & bit) + mpz_mul (tr, tr, base); + if (tr->_mp_size > mn) + { + mpn_div_qr_preinv (NULL, tr->_mp_d, tr->_mp_size, mp, mn, &minv); + tr->_mp_size = mpn_normalized_size (tr->_mp_d, mn); + } + bit >>= 1; + } while (bit > 0); } @@ -3185,8 +3185,8 @@ mpz_powm (mpz_t r, const mpz_t b, const mpz_t e, const mpz_t m) mpn_div_qr_preinv (NULL, tr->_mp_d, tr->_mp_size, mp, mn, &minv); tr->_mp_size = mpn_normalized_size (tr->_mp_d, mn); } - //if (tp) - // gmp_free_limbs (tp, mn); + if (tp) + gmp_free_limbs (tp, mn); mpz_swap (r, tr); mpz_clear (tr); @@ -3232,11 +3232,11 @@ mpz_rootrem (mpz_t x, mpz_t r, const mpz_t y, unsigned long z) if (z == 2) /* simplify sqrt loop: z-1 == 1 */ do { - mpz_swap (u, t); /* u = x */ - mpz_tdiv_q (t, y, u); /* t = y/x */ - mpz_add (t, t, u); /* t = y/x + x */ - mpz_tdiv_q_2exp (t, t, 1); /* x'= (y/x + x)/2 */ - } while (mpz_cmpabs (t, u) < 0); /* |x'| < |x| */ + mpz_swap (u, t); /* u = x */ + mpz_tdiv_q (t, y, u); /* t = y/x */ + mpz_add (t, t, u); /* t = y/x + x */ + mpz_tdiv_q_2exp (t, t, 1); /* x'= (y/x + x)/2 */ + } while (mpz_cmpabs (t, u) < 0); /* |x'| < |x| */ else /* z != 2 */ { mpz_t v; @@ -3245,13 +3245,13 @@ mpz_rootrem (mpz_t x, mpz_t r, const mpz_t y, unsigned long z) mpz_neg (t, t); do { - mpz_swap (u, t); /* u = x */ - mpz_pow_ui (t, u, z - 1); /* t = x^(z-1) */ - mpz_tdiv_q (t, y, t); /* t = y/x^(z-1) */ - mpz_mul_ui (v, u, z - 1); /* v = x*(z-1) */ - mpz_add (t, t, v); /* t = y/x^(z-1) + x*(z-1) */ - mpz_tdiv_q_ui (t, t, z); /* x'=(y/x^(z-1) + x*(z-1))/z */ - } while (mpz_cmpabs (t, u) < 0); /* |x'| < |x| */ + mpz_swap (u, t); /* u = x */ + mpz_pow_ui (t, u, z - 1); /* t = x^(z-1) */ + mpz_tdiv_q (t, y, t); /* t = y/x^(z-1) */ + mpz_mul_ui (v, u, z - 1); /* v = x*(z-1) */ + mpz_add (t, t, v); /* t = y/x^(z-1) + x*(z-1) */ + mpz_tdiv_q_ui (t, t, z); /* x'=(y/x^(z-1) + x*(z-1))/z */ + } while (mpz_cmpabs (t, u) < 0); /* |x'| < |x| */ mpz_clear (v); } @@ -3405,18 +3405,18 @@ gmp_jacobi_coprime (mp_limb_t a, mp_limb_t b) /* (2/b) = -1 if b = 3 or 5 mod 8 */ bit ^= c & (b ^ (b >> 1)); if (a < b) - { - if (a == 0) - return bit & 1 ? -1 : 1; - bit ^= a & b; - a = b - a; - b -= a; - } + { + if (a == 0) + return bit & 1 ? -1 : 1; + bit ^= a & b; + a = b - a; + b -= a; + } else - { - a -= b; - assert (a != 0); - } + { + a -= b; + assert (a != 0); + } gmp_ctz(c, a); ++c; @@ -3441,7 +3441,7 @@ gmp_lucas_step_k_2k (mpz_t V, mpz_t Qk, const mpz_t n) /* Returns (U_k == 0) and sets V=V_k and Qk=Q^k. */ static int gmp_lucas_mod (mpz_t V, mpz_t Qk, long Q, - mp_bitcnt_t b0, const mpz_t n) + mp_bitcnt_t b0, const mpz_t n) { mp_bitcnt_t bs; mpz_t U; @@ -3465,27 +3465,27 @@ gmp_lucas_mod (mpz_t V, mpz_t Qk, long Q, /* Q^{2k} = (Q^k)^2 */ gmp_lucas_step_k_2k (V, Qk, n); - /* A step k->k+1 is performed if the bit in $n$ is 1 */ - /* mpz_tstbit(n,bs) or the bit is 0 in $n$ but */ - /* should be 1 in $n+1$ (bs == b0) */ + /* A step k->k+1 is performed if the bit in $n$ is 1 */ + /* mpz_tstbit(n,bs) or the bit is 0 in $n$ but */ + /* should be 1 in $n+1$ (bs == b0) */ if (b0 == bs || mpz_tstbit (n, bs)) - { - /* Q^{k+1} <- Q^k * Q */ - mpz_mul_si (Qk, Qk, Q); - /* U_{k+1} <- (U_k + V_k) / 2 */ - mpz_swap (U, V); /* Keep in V the old value of U_k */ - mpz_add (U, U, V); - /* We have to compute U/2, so we need an even value, */ - /* equivalent (mod n) */ - if (mpz_odd_p (U)) - mpz_add (U, U, n); - mpz_tdiv_q_2exp (U, U, 1); - /* V_{k+1} <-(D*U_k + V_k) / 2 = - U_{k+1} + (D-1)/2*U_k = U_{k+1} - 2Q*U_k */ - mpz_mul_si (V, V, -2*Q); - mpz_add (V, U, V); - mpz_tdiv_r (V, V, n); - } + { + /* Q^{k+1} <- Q^k * Q */ + mpz_mul_si (Qk, Qk, Q); + /* U_{k+1} <- (U_k + V_k) / 2 */ + mpz_swap (U, V); /* Keep in V the old value of U_k */ + mpz_add (U, U, V); + /* We have to compute U/2, so we need an even value, */ + /* equivalent (mod n) */ + if (mpz_odd_p (U)) + mpz_add (U, U, n); + mpz_tdiv_q_2exp (U, U, 1); + /* V_{k+1} <-(D*U_k + V_k) / 2 = + U_{k+1} + (D-1)/2*U_k = U_{k+1} - 2Q*U_k */ + mpz_mul_si (V, V, -2*Q); + mpz_add (V, U, V); + mpz_tdiv_r (V, V, n); + } mpz_tdiv_r (U, U, n); } @@ -3524,11 +3524,11 @@ gmp_stronglucas (const mpz_t x, mpz_t Qk) do { if (D >= maxD) - return 1 + (D != GMP_LIMB_MAX); /* (1 + ! ~ D) */ + return 1 + (D != GMP_LIMB_MAX); /* (1 + ! ~ D) */ D += 2; tl = mpz_tdiv_ui (n, D); if (tl == 0) - return 0; + return 0; } while (gmp_jacobi_coprime (tl, D) == 1); @@ -3541,8 +3541,8 @@ gmp_stronglucas (const mpz_t x, mpz_t Qk) /* D= P^2 - 4Q; P = 1; Q = (1-D)/4 */ Q = (D & 2) ? (long) (D >> 2) + 1 : -(long) (D >> 2); - if (! gmp_lucas_mod (V, Qk, Q, b0, n)) /* If Ud != 0 */ - while (V->_mp_size != 0 && --b0 != 0) /* while Vk != 0 */ + if (! gmp_lucas_mod (V, Qk, Q, b0, n)) /* If Ud != 0 */ + while (V->_mp_size != 0 && --b0 != 0) /* while Vk != 0 */ /* V <- V ^ 2 - 2Q^k */ /* Q^{2k} = (Q^k)^2 */ gmp_lucas_step_k_2k (V, Qk, n); @@ -3553,7 +3553,7 @@ gmp_stronglucas (const mpz_t x, mpz_t Qk) static int gmp_millerrabin (const mpz_t n, const mpz_t nm1, mpz_t y, - const mpz_t q, mp_bitcnt_t k) + const mpz_t q, mp_bitcnt_t k) { assert (k > 0); @@ -3567,7 +3567,7 @@ gmp_millerrabin (const mpz_t n, const mpz_t nm1, mpz_t y, { mpz_powm_ui (y, y, 2, n); if (mpz_cmp (y, nm1) == 0) - return 1; + return 1; } return 0; } @@ -3631,12 +3631,12 @@ mpz_probab_prime_p (const mpz_t n, int reps) { mpz_set_ui (y, (unsigned long) j*j+j+41); if (mpz_cmp (y, nm1) >= 0) - { - /* Don't try any further bases. This "early" break does not affect - the result for any reasonable reps value (<=5000 was tested) */ - assert (j >= 30); - break; - } + { + /* Don't try any further bases. This "early" break does not affect + the result for any reasonable reps value (<=5000 was tested) */ + assert (j >= 30); + break; + } is_prime = gmp_millerrabin (n, nm1, y, q, k); } mpz_clear (nm1); @@ -3694,12 +3694,12 @@ mpz_tstbit (const mpz_t d, mp_bitcnt_t bit_index) if (ds < 0) { /* d < 0. Check if any of the bits below is set: If so, our bit - must be complemented. */ + must be complemented. */ if (shift > 0 && (mp_limb_t) (w << (GMP_LIMB_BITS - shift)) > 0) - return bit ^ 1; + return bit ^ 1; while (--limb_index >= 0) - if (d->_mp_d[limb_index] > 0) - return bit ^ 1; + if (d->_mp_d[limb_index] > 0) + return bit ^ 1; } return bit; } @@ -3720,12 +3720,12 @@ mpz_abs_add_bit (mpz_t d, mp_bitcnt_t bit_index) { mp_size_t i; /* The bit should be set outside of the end of the number. - We have to increase the size of the number. */ + We have to increase the size of the number. */ dp = MPZ_REALLOC (d, limb_index + 1); dp[limb_index] = bit; for (i = dn; i < limb_index; i++) - dp[i] = 0; + dp[i] = 0; dn = limb_index + 1; } else @@ -3736,10 +3736,10 @@ mpz_abs_add_bit (mpz_t d, mp_bitcnt_t bit_index) cy = mpn_add_1 (dp + limb_index, dp + limb_index, dn - limb_index, bit); if (cy > 0) - { - dp = MPZ_REALLOC (d, dn + 1); - dp[dn++] = cy; - } + { + dp = MPZ_REALLOC (d, dn + 1); + dp[dn++] = cy; + } } d->_mp_size = (d->_mp_size < 0) ? - dn : dn; @@ -3761,7 +3761,7 @@ mpz_abs_sub_bit (mpz_t d, mp_bitcnt_t bit_index) assert (limb_index < dn); gmp_assert_nocarry (mpn_sub_1 (dp + limb_index, dp + limb_index, - dn - limb_index, bit)); + dn - limb_index, bit)); dn = mpn_normalized_size (dp, dn); d->_mp_size = (d->_mp_size < 0) ? - dn : dn; } @@ -3772,9 +3772,9 @@ mpz_setbit (mpz_t d, mp_bitcnt_t bit_index) if (!mpz_tstbit (d, bit_index)) { if (d->_mp_size >= 0) - mpz_abs_add_bit (d, bit_index); + mpz_abs_add_bit (d, bit_index); else - mpz_abs_sub_bit (d, bit_index); + mpz_abs_sub_bit (d, bit_index); } } @@ -3784,9 +3784,9 @@ mpz_clrbit (mpz_t d, mp_bitcnt_t bit_index) if (mpz_tstbit (d, bit_index)) { if (d->_mp_size >= 0) - mpz_abs_sub_bit (d, bit_index); + mpz_abs_sub_bit (d, bit_index); else - mpz_abs_add_bit (d, bit_index); + mpz_abs_add_bit (d, bit_index); } } @@ -3810,7 +3810,7 @@ void mpz_and (mpz_t r, const mpz_t u, const mpz_t v) { mp_size_t un, vn, rn, i; - mp_ptr up, vp, rp; + mp_ptr up, vp, rp; mp_limb_t ux, vx, rx; mp_limb_t uc, vc, rc; @@ -3842,8 +3842,8 @@ mpz_and (mpz_t r, const mpz_t u, const mpz_t v) rp = MPZ_REALLOC (r, rn + (mp_size_t) rc); - up = *(mp_ptr *)u->_mp_d; - vp = *(mp_ptr *)v->_mp_d; + up = u->_mp_d; + vp = v->_mp_d; i = 0; do @@ -3915,8 +3915,8 @@ mpz_ior (mpz_t r, const mpz_t u, const mpz_t v) rp = MPZ_REALLOC (r, rn + (mp_size_t) rc); - up = *(mp_ptr *)u->_mp_d; - vp = *(mp_ptr *)v->_mp_d; + up = u->_mp_d; + vp = v->_mp_d; i = 0; do @@ -3984,8 +3984,8 @@ mpz_xor (mpz_t r, const mpz_t u, const mpz_t v) rp = MPZ_REALLOC (r, un + (mp_size_t) rc); - up = *(mp_ptr *)u->_mp_d; - vp = *(mp_ptr *)v->_mp_d; + up = u->_mp_d; + vp = v->_mp_d; i = 0; do @@ -4035,9 +4035,9 @@ gmp_popcount_limb (mp_limb_t x) w = ((w >> 8) & 0x000f) + (w & 0x000f); c += w; if (GMP_LIMB_BITS > LOCAL_SHIFT_BITS) - x >>= LOCAL_SHIFT_BITS; + x >>= LOCAL_SHIFT_BITS; else - x = 0; + x = 0; } return c; } @@ -4134,18 +4134,18 @@ mpz_scan1 (const mpz_t u, mp_bitcnt_t starting_bit) if (i >= un) return (us >= 0 ? ~(mp_bitcnt_t) 0 : starting_bit); - up = *(mp_ptr *)u->_mp_d; + up = u->_mp_d; ux = 0; limb = up[i]; if (starting_bit != 0) { if (us < 0) - { - ux = mpn_zero_p (up, i); - limb = ~ limb + ux; - ux = - (mp_limb_t) (limb >= ux); - } + { + ux = mpn_zero_p (up, i); + limb = ~ limb + ux; + ux = - (mp_limb_t) (limb >= ux); + } /* Mask to 0 all bits before starting_bit, thus ignoring them. */ limb &= GMP_LIMB_MAX << (starting_bit % GMP_LIMB_BITS); @@ -4171,7 +4171,7 @@ mpz_scan0 (const mpz_t u, mp_bitcnt_t starting_bit) if (i >= un) return (ux ? starting_bit : ~(mp_bitcnt_t) 0); - up = *(mp_ptr *)u->_mp_d; + up = u->_mp_d; limb = up[i] ^ ux; if (ux == 0) @@ -4191,8 +4191,7 @@ mpz_sizeinbase (const mpz_t u, int base) { mp_size_t un, tn; mp_srcptr up; - //mp_ptr tp; - mpz_t tp; + mp_ptr tp; mp_bitcnt_t bits; struct gmp_div_inverse bi; size_t ndigits; @@ -4220,11 +4219,11 @@ mpz_sizeinbase (const mpz_t u, int base) case 32: return (bits + 4) / 5; /* FIXME: Do something more clever for the common case of base - 10. */ + 10. */ } - //tp = gmp_alloc_limbs (un); - mpn_copyi (tp->_mp_d, up, un); + tp = gmp_alloc_limbs (un); + mpn_copyi (tp, up, un); mpn_div_qr_1_invert (&bi, base); tn = un; @@ -4232,12 +4231,12 @@ mpz_sizeinbase (const mpz_t u, int base) do { ndigits++; - mpn_div_qr_1_preinv (tp->_mp_d, tp->_mp_d, tn, &bi); - tn -= (tp->_mp_d[tn-1] == 0); + mpn_div_qr_1_preinv (tp, tp, tn, &bi); + tn -= (tp[tn-1] == 0); } while (tn > 0); - // gmp_free_limbs (tp, un); + gmp_free_limbs (tp, un); return ndigits; } @@ -4253,9 +4252,9 @@ mpz_get_str (char *sp, int base, const mpz_t u) if (base > 1) { if (base <= 36) - digits = "0123456789abcdefghijklmnopqrstuvwxyz"; + digits = "0123456789abcdefghijklmnopqrstuvwxyz"; else if (base > 62) - return NULL; + return NULL; } else if (base >= -1) base = 10; @@ -4263,7 +4262,7 @@ mpz_get_str (char *sp, int base, const mpz_t u) { base = -base; if (base > 36) - return NULL; + return NULL; } sn = 1 + mpz_sizeinbase (u, base); @@ -4316,20 +4315,6 @@ ret: return sp; } - -int strlen_c(const char *c) { - - // rather naive implementation – we assume a string is terminated, and is not 0 characters long. - - int i = 0; - while (1) { - if (c[i] == '\0') - return i; - i++; - } - return i; -} - int mpz_set_str (mpz_t r, const char *sp, int base) { @@ -4351,22 +4336,22 @@ mpz_set_str (mpz_t r, const char *sp, int base) if (base == 0) { if (sp[0] == '0') - { - if (sp[1] == 'x' || sp[1] == 'X') - { - base = 16; - sp += 2; - } - else if (sp[1] == 'b' || sp[1] == 'B') - { - base = 2; - sp += 2; - } - else - base = 8; - } + { + if (sp[1] == 'x' || sp[1] == 'X') + { + base = 16; + sp += 2; + } + else if (sp[1] == 'b' || sp[1] == 'B') + { + base = 2; + sp += 2; + } + else + base = 8; + } else - base = 10; + base = 10; } if (!*sp) @@ -4383,22 +4368,22 @@ mpz_set_str (mpz_t r, const char *sp, int base) unsigned digit; if (isspace ((unsigned char) *sp)) - continue; + continue; else if (*sp >= '0' && *sp <= '9') - digit = *sp - '0'; + digit = *sp - '0'; else if (*sp >= 'a' && *sp <= 'z') - digit = *sp - 'a' + value_of_a; + digit = *sp - 'a' + value_of_a; else if (*sp >= 'A' && *sp <= 'Z') - digit = *sp - 'A' + 10; + digit = *sp - 'A' + 10; else - digit = base; /* fail */ + digit = base; /* fail */ if (digit >= (unsigned) base) - { - gmp_free (dp, sn); - r->_mp_size = 0; - return -1; - } + { + gmp_free (dp, sn); + r->_mp_size = 0; + return -1; + } dp[dn++] = digit; } @@ -4470,7 +4455,7 @@ gmp_detect_endian (void) /* Import and export. Does not support nails. */ void mpz_import (mpz_t r, size_t count, int order, size_t size, int endian, - size_t nails, const void *src) + size_t nails, const void *src) { const unsigned char *p; ptrdiff_t word_step; @@ -4517,15 +4502,15 @@ mpz_import (mpz_t r, size_t count, int order, size_t size, int endian, { size_t j; for (j = 0; j < size; j++, p -= (ptrdiff_t) endian) - { - limb |= (mp_limb_t) *p << (bytes++ * CHAR_BIT); - if (bytes == sizeof(mp_limb_t)) - { - rp[i++] = limb; - bytes = 0; - limb = 0; - } - } + { + limb |= (mp_limb_t) *p << (bytes++ * CHAR_BIT); + if (bytes == sizeof(mp_limb_t)) + { + rp[i++] = limb; + bytes = 0; + limb = 0; + } + } } assert (i + (bytes > 0) == rn); if (limb != 0) @@ -4538,7 +4523,7 @@ mpz_import (mpz_t r, size_t count, int order, size_t size, int endian, void * mpz_export (void *r, size_t *countp, int order, size_t size, int endian, - size_t nails, const mpz_t u) + size_t nails, const mpz_t u) { size_t count; mp_size_t un; @@ -4572,65 +4557,65 @@ mpz_export (void *r, size_t *countp, int order, size_t size, int endian, k = (GMP_LIMB_BITS <= CHAR_BIT); if (!k) - { - do { - int LOCAL_CHAR_BIT = CHAR_BIT; - k++; limb >>= LOCAL_CHAR_BIT; - } while (limb != 0); - } + { + do { + int LOCAL_CHAR_BIT = CHAR_BIT; + k++; limb >>= LOCAL_CHAR_BIT; + } while (limb != 0); + } /* else limb = 0; */ count = (k + (un-1) * sizeof (mp_limb_t) + size - 1) / size; if (!r) - r = gmp_alloc (count * size); + r = gmp_alloc (count * size); if (endian == 0) - endian = gmp_detect_endian (); + endian = gmp_detect_endian (); p = (unsigned char *) r; word_step = (order != endian) ? 2 * size : 0; /* Process bytes from the least significant end, so point p at the - least significant word. */ + least significant word. */ if (order == 1) - { - p += size * (count - 1); - word_step = - word_step; - } + { + p += size * (count - 1); + word_step = - word_step; + } /* And at least significant byte of that word. */ if (endian == 1) - p += (size - 1); + p += (size - 1); for (bytes = 0, i = 0, k = 0; k < count; k++, p += word_step) - { - size_t j; - for (j = 0; j < size; ++j, p -= (ptrdiff_t) endian) - { - if (sizeof (mp_limb_t) == 1) - { - if (i < un) - *p = u->_mp_d[i++]; - else - *p = 0; - } - else - { - int LOCAL_CHAR_BIT = CHAR_BIT; - if (bytes == 0) - { - if (i < un) - limb = u->_mp_d[i++]; - bytes = sizeof (mp_limb_t); - } - *p = limb; - limb >>= LOCAL_CHAR_BIT; - bytes--; - } - } - } + { + size_t j; + for (j = 0; j < size; ++j, p -= (ptrdiff_t) endian) + { + if (sizeof (mp_limb_t) == 1) + { + if (i < un) + *p = u->_mp_d[i++]; + else + *p = 0; + } + else + { + int LOCAL_CHAR_BIT = CHAR_BIT; + if (bytes == 0) + { + if (i < un) + limb = u->_mp_d[i++]; + bytes = sizeof (mp_limb_t); + } + *p = limb; + limb >>= LOCAL_CHAR_BIT; + bytes--; + } + } + } assert (i == un); assert (k == count); } @@ -4640,4 +4625,3 @@ mpz_export (void *r, size_t *countp, int order, size_t size, int endian, return r; } - diff --git a/source/gmp.h b/source/gmp.h @@ -0,0 +1,310 @@ +/* mini-gmp, a minimalistic implementation of a GNU GMP subset. + +Copyright 2011-2015, 2017, 2019-2021 Free Software Foundation, Inc. + +This file is part of the GNU MP Library. + +The GNU MP Library is free software; you can redistribute it and/or modify +it under the terms of either: + + * the GNU Lesser General Public License as published by the Free + Software Foundation; either version 3 of the License, or (at your + option) any later version. + +or + + * the GNU General Public License as published by the Free Software + Foundation; either version 2 of the License, or (at your option) any + later version. + +or both in parallel, as here. + +The GNU MP Library is distributed in the hope that it will be useful, but +WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +for more details. + +You should have received copies of the GNU General Public License and the +GNU Lesser General Public License along with the GNU MP Library. If not, +see https://www.gnu.org/licenses/. */ + +/* About mini-gmp: This is a minimal implementation of a subset of the + GMP interface. It is intended for inclusion into applications which + have modest bignums needs, as a fallback when the real GMP library + is not installed. + + This file defines the public interface. */ + +#ifndef __MINI_GMP_H__ +#define __MINI_GMP_H__ + +/* For size_t */ +#include <stddef.h> + +#if defined (__cplusplus) +extern "C" { +#endif + +void mp_set_memory_functions (void *(*) (size_t), + void *(*) (void *, size_t, size_t), + void (*) (void *, size_t)); + +void mp_get_memory_functions (void *(**) (size_t), + void *(**) (void *, size_t, size_t), + void (**) (void *, size_t)); + +#ifndef MINI_GMP_LIMB_TYPE +#define MINI_GMP_LIMB_TYPE long +#endif + +typedef unsigned MINI_GMP_LIMB_TYPE mp_limb_t; +typedef long mp_size_t; +typedef unsigned long mp_bitcnt_t; + +typedef mp_limb_t *mp_ptr; +typedef const mp_limb_t *mp_srcptr; + +typedef struct +{ + int _mp_alloc; /* Number of *limbs* allocated and pointed + to by the _mp_d field. */ + int _mp_size; /* abs(_mp_size) is the number of limbs the + last field points to. If _mp_size is + negative this is a negative number. */ + mp_limb_t *_mp_d; /* Pointer to the limbs. */ +} __mpz_struct; + +typedef __mpz_struct mpz_t[1]; + +typedef __mpz_struct *mpz_ptr; +typedef const __mpz_struct *mpz_srcptr; + +extern const int mp_bits_per_limb; + +void mpn_copyi (mp_ptr, mp_srcptr, mp_size_t); +void mpn_copyd (mp_ptr, mp_srcptr, mp_size_t); +void mpn_zero (mp_ptr, mp_size_t); + +int mpn_cmp (mp_srcptr, mp_srcptr, mp_size_t); +int mpn_zero_p (mp_srcptr, mp_size_t); + +mp_limb_t mpn_add_1 (mp_ptr, mp_srcptr, mp_size_t, mp_limb_t); +mp_limb_t mpn_add_n (mp_ptr, mp_srcptr, mp_srcptr, mp_size_t); +mp_limb_t mpn_add (mp_ptr, mp_srcptr, mp_size_t, mp_srcptr, mp_size_t); + +mp_limb_t mpn_sub_1 (mp_ptr, mp_srcptr, mp_size_t, mp_limb_t); +mp_limb_t mpn_sub_n (mp_ptr, mp_srcptr, mp_srcptr, mp_size_t); +mp_limb_t mpn_sub (mp_ptr, mp_srcptr, mp_size_t, mp_srcptr, mp_size_t); + +mp_limb_t mpn_mul_1 (mp_ptr, mp_srcptr, mp_size_t, mp_limb_t); +mp_limb_t mpn_addmul_1 (mp_ptr, mp_srcptr, mp_size_t, mp_limb_t); +mp_limb_t mpn_submul_1 (mp_ptr, mp_srcptr, mp_size_t, mp_limb_t); + +mp_limb_t mpn_mul (mp_ptr, mp_srcptr, mp_size_t, mp_srcptr, mp_size_t); +void mpn_mul_n (mp_ptr, mp_srcptr, mp_srcptr, mp_size_t); +void mpn_sqr (mp_ptr, mp_srcptr, mp_size_t); +int mpn_perfect_square_p (mp_srcptr, mp_size_t); +mp_size_t mpn_sqrtrem (mp_ptr, mp_ptr, mp_srcptr, mp_size_t); + +mp_limb_t mpn_lshift (mp_ptr, mp_srcptr, mp_size_t, unsigned int); +mp_limb_t mpn_rshift (mp_ptr, mp_srcptr, mp_size_t, unsigned int); + +mp_bitcnt_t mpn_scan0 (mp_srcptr, mp_bitcnt_t); +mp_bitcnt_t mpn_scan1 (mp_srcptr, mp_bitcnt_t); + +void mpn_com (mp_ptr, mp_srcptr, mp_size_t); +mp_limb_t mpn_neg (mp_ptr, mp_srcptr, mp_size_t); + +mp_bitcnt_t mpn_popcount (mp_srcptr, mp_size_t); + +mp_limb_t mpn_invert_3by2 (mp_limb_t, mp_limb_t); +#define mpn_invert_limb(x) mpn_invert_3by2 ((x), 0) + +size_t mpn_get_str (unsigned char *, int, mp_ptr, mp_size_t); +mp_size_t mpn_set_str (mp_ptr, const unsigned char *, size_t, int); + +void mpz_init (mpz_t); +void mpz_init2 (mpz_t, mp_bitcnt_t); +void mpz_clear (mpz_t); + +#define mpz_odd_p(z) (((z)->_mp_size != 0) & (int) (z)->_mp_d[0]) +#define mpz_even_p(z) (! mpz_odd_p (z)) + +int mpz_sgn (const mpz_t); +int mpz_cmp_si (const mpz_t, long); +int mpz_cmp_ui (const mpz_t, unsigned long); +int mpz_cmp (const mpz_t, const mpz_t); +int mpz_cmpabs_ui (const mpz_t, unsigned long); +int mpz_cmpabs (const mpz_t, const mpz_t); +int mpz_cmp_d (const mpz_t, double); +int mpz_cmpabs_d (const mpz_t, double); + +void mpz_abs (mpz_t, const mpz_t); +void mpz_neg (mpz_t, const mpz_t); +void mpz_swap (mpz_t, mpz_t); + +void mpz_add_ui (mpz_t, const mpz_t, unsigned long); +void mpz_add (mpz_t, const mpz_t, const mpz_t); +void mpz_sub_ui (mpz_t, const mpz_t, unsigned long); +void mpz_ui_sub (mpz_t, unsigned long, const mpz_t); +void mpz_sub (mpz_t, const mpz_t, const mpz_t); + +void mpz_mul_si (mpz_t, const mpz_t, long int); +void mpz_mul_ui (mpz_t, const mpz_t, unsigned long int); +void mpz_mul (mpz_t, const mpz_t, const mpz_t); +void mpz_mul_2exp (mpz_t, const mpz_t, mp_bitcnt_t); +void mpz_addmul_ui (mpz_t, const mpz_t, unsigned long int); +void mpz_addmul (mpz_t, const mpz_t, const mpz_t); +void mpz_submul_ui (mpz_t, const mpz_t, unsigned long int); +void mpz_submul (mpz_t, const mpz_t, const mpz_t); + +void mpz_cdiv_qr (mpz_t, mpz_t, const mpz_t, const mpz_t); +void mpz_fdiv_qr (mpz_t, mpz_t, const mpz_t, const mpz_t); +void mpz_tdiv_qr (mpz_t, mpz_t, const mpz_t, const mpz_t); +void mpz_cdiv_q (mpz_t, const mpz_t, const mpz_t); +void mpz_fdiv_q (mpz_t, const mpz_t, const mpz_t); +void mpz_tdiv_q (mpz_t, const mpz_t, const mpz_t); +void mpz_cdiv_r (mpz_t, const mpz_t, const mpz_t); +void mpz_fdiv_r (mpz_t, const mpz_t, const mpz_t); +void mpz_tdiv_r (mpz_t, const mpz_t, const mpz_t); + +void mpz_cdiv_q_2exp (mpz_t, const mpz_t, mp_bitcnt_t); +void mpz_fdiv_q_2exp (mpz_t, const mpz_t, mp_bitcnt_t); +void mpz_tdiv_q_2exp (mpz_t, const mpz_t, mp_bitcnt_t); +void mpz_cdiv_r_2exp (mpz_t, const mpz_t, mp_bitcnt_t); +void mpz_fdiv_r_2exp (mpz_t, const mpz_t, mp_bitcnt_t); +void mpz_tdiv_r_2exp (mpz_t, const mpz_t, mp_bitcnt_t); + +void mpz_mod (mpz_t, const mpz_t, const mpz_t); + +void mpz_divexact (mpz_t, const mpz_t, const mpz_t); + +int mpz_divisible_p (const mpz_t, const mpz_t); +int mpz_congruent_p (const mpz_t, const mpz_t, const mpz_t); + +unsigned long mpz_cdiv_qr_ui (mpz_t, mpz_t, const mpz_t, unsigned long); +unsigned long mpz_fdiv_qr_ui (mpz_t, mpz_t, const mpz_t, unsigned long); +unsigned long mpz_tdiv_qr_ui (mpz_t, mpz_t, const mpz_t, unsigned long); +unsigned long mpz_cdiv_q_ui (mpz_t, const mpz_t, unsigned long); +unsigned long mpz_fdiv_q_ui (mpz_t, const mpz_t, unsigned long); +unsigned long mpz_tdiv_q_ui (mpz_t, const mpz_t, unsigned long); +unsigned long mpz_cdiv_r_ui (mpz_t, const mpz_t, unsigned long); +unsigned long mpz_fdiv_r_ui (mpz_t, const mpz_t, unsigned long); +unsigned long mpz_tdiv_r_ui (mpz_t, const mpz_t, unsigned long); +unsigned long mpz_cdiv_ui (const mpz_t, unsigned long); +unsigned long mpz_fdiv_ui (const mpz_t, unsigned long); +unsigned long mpz_tdiv_ui (const mpz_t, unsigned long); + +unsigned long mpz_mod_ui (mpz_t, const mpz_t, unsigned long); + +void mpz_divexact_ui (mpz_t, const mpz_t, unsigned long); + +int mpz_divisible_ui_p (const mpz_t, unsigned long); + +unsigned long mpz_gcd_ui (mpz_t, const mpz_t, unsigned long); +void mpz_gcd (mpz_t, const mpz_t, const mpz_t); +void mpz_gcdext (mpz_t, mpz_t, mpz_t, const mpz_t, const mpz_t); +void mpz_lcm_ui (mpz_t, const mpz_t, unsigned long); +void mpz_lcm (mpz_t, const mpz_t, const mpz_t); +int mpz_invert (mpz_t, const mpz_t, const mpz_t); + +void mpz_sqrtrem (mpz_t, mpz_t, const mpz_t); +void mpz_sqrt (mpz_t, const mpz_t); +int mpz_perfect_square_p (const mpz_t); + +void mpz_pow_ui (mpz_t, const mpz_t, unsigned long); +void mpz_ui_pow_ui (mpz_t, unsigned long, unsigned long); +void mpz_powm (mpz_t, const mpz_t, const mpz_t, const mpz_t); +void mpz_powm_ui (mpz_t, const mpz_t, unsigned long, const mpz_t); + +void mpz_rootrem (mpz_t, mpz_t, const mpz_t, unsigned long); +int mpz_root (mpz_t, const mpz_t, unsigned long); + +void mpz_fac_ui (mpz_t, unsigned long); +void mpz_2fac_ui (mpz_t, unsigned long); +void mpz_mfac_uiui (mpz_t, unsigned long, unsigned long); +void mpz_bin_uiui (mpz_t, unsigned long, unsigned long); + +int mpz_probab_prime_p (const mpz_t, int); + +int mpz_tstbit (const mpz_t, mp_bitcnt_t); +void mpz_setbit (mpz_t, mp_bitcnt_t); +void mpz_clrbit (mpz_t, mp_bitcnt_t); +void mpz_combit (mpz_t, mp_bitcnt_t); + +void mpz_com (mpz_t, const mpz_t); +void mpz_and (mpz_t, const mpz_t, const mpz_t); +void mpz_ior (mpz_t, const mpz_t, const mpz_t); +void mpz_xor (mpz_t, const mpz_t, const mpz_t); + +mp_bitcnt_t mpz_popcount (const mpz_t); +mp_bitcnt_t mpz_hamdist (const mpz_t, const mpz_t); +mp_bitcnt_t mpz_scan0 (const mpz_t, mp_bitcnt_t); +mp_bitcnt_t mpz_scan1 (const mpz_t, mp_bitcnt_t); + +int mpz_fits_slong_p (const mpz_t); +int mpz_fits_ulong_p (const mpz_t); +int mpz_fits_sint_p (const mpz_t); +int mpz_fits_uint_p (const mpz_t); +int mpz_fits_sshort_p (const mpz_t); +int mpz_fits_ushort_p (const mpz_t); +long int mpz_get_si (const mpz_t); +unsigned long int mpz_get_ui (const mpz_t); +double mpz_get_d (const mpz_t); +size_t mpz_size (const mpz_t); +mp_limb_t mpz_getlimbn (const mpz_t, mp_size_t); + +void mpz_realloc2 (mpz_t, mp_bitcnt_t); +mp_srcptr mpz_limbs_read (mpz_srcptr); +mp_ptr mpz_limbs_modify (mpz_t, mp_size_t); +mp_ptr mpz_limbs_write (mpz_t, mp_size_t); +void mpz_limbs_finish (mpz_t, mp_size_t); +mpz_srcptr mpz_roinit_n (mpz_t, mp_srcptr, mp_size_t); + +#define MPZ_ROINIT_N(xp, xs) {{0, (xs),(xp) }} + +void mpz_set_si (mpz_t, signed long int); +void mpz_set_ui (mpz_t, unsigned long int); +void mpz_set (mpz_t, const mpz_t); +void mpz_set_d (mpz_t, double); + +void mpz_init_set_si (mpz_t, signed long int); +void mpz_init_set_ui (mpz_t, unsigned long int); +void mpz_init_set (mpz_t, const mpz_t); +void mpz_init_set_d (mpz_t, double); + +size_t mpz_sizeinbase (const mpz_t, int); +char *mpz_get_str (char *, int, const mpz_t); +int mpz_set_str (mpz_t, const char *, int); +int mpz_init_set_str (mpz_t, const char *, int); + +/* This long list taken from gmp.h. */ +/* For reference, "defined(EOF)" cannot be used here. In g++ 2.95.4, + <iostream> defines EOF but not FILE. */ +#if defined (FILE) \ + || defined (H_STDIO) \ + || defined (_H_STDIO) /* AIX */ \ + || defined (_STDIO_H) /* glibc, Sun, SCO */ \ + || defined (_STDIO_H_) /* BSD, OSF */ \ + || defined (__STDIO_H) /* Borland */ \ + || defined (__STDIO_H__) /* IRIX */ \ + || defined (_STDIO_INCLUDED) /* HPUX */ \ + || defined (__dj_include_stdio_h_) /* DJGPP */ \ + || defined (_FILE_DEFINED) /* Microsoft */ \ + || defined (__STDIO__) /* Apple MPW MrC */ \ + || defined (_MSL_STDIO_H) /* Metrowerks */ \ + || defined (_STDIO_H_INCLUDED) /* QNX4 */ \ + || defined (_ISO_STDIO_ISO_H) /* Sun C++ */ \ + || defined (__STDIO_LOADED) /* VMS */ \ + || defined (_STDIO) /* HPE NonStop */ \ + || defined (__DEFINED_FILE) /* musl */ +size_t mpz_out_str (FILE *, int, const mpz_t); +#endif + +void mpz_import (mpz_t, size_t, int, size_t, int, size_t, const void *); +void *mpz_export (void *, size_t *, int, size_t, int, size_t, const mpz_t); + +#if defined (__cplusplus) +} +#endif +#endif /* __MINI_GMP_H__ */ diff --git a/source/lib-gpu-verify.c b/source/lib-gpu-verify.c @@ -10,6 +10,7 @@ #include "reference-test.h" #include "montgomery-test.h" +#include "montmodmult.h" int main(int argc, char** argv) @@ -19,12 +20,12 @@ int main(int argc, char** argv) setup_gcry(); - + mont_modmult_tests(); // MARK: might have memory issues - mont_rsa_tests(); + //mont_rsa_tests(); - //rsa_tests(); + rsa_tests(); //reference_tests(); diff --git a/source/montgomery-test.c b/source/montgomery-test.c @@ -7,7 +7,7 @@ #include "montgomery-test.h" -#include "gmp.h" // has been adapted +#include <gmp.h> // has been adapted void mont_pairs_from_files(void *bases, unsigned long *b_off, void *exponents, unsigned long *e_off, diff --git a/source/montgomery.h b/source/montgomery.h @@ -10,7 +10,7 @@ #include <stdio.h> -#include "gmp.h" +#include <gmp.h> #include <assert.h> diff --git a/source/montmodmult.c b/source/montmodmult.c @@ -6,3 +6,619 @@ // #include "montmodmult.h" +#include "util.h" + +static unsigned long len_in_bytes = 0; + +#define ORDER -1 // I think we need to do this, because we want to write it in the 'wrong' way +#define END 0 + +#define BIT_LENGTH 2048 + +#define BITS 64 + +// sizes are always the same 32 units for all, except exp_buf +void montmodmult_pairs_from_files(void *x_buf, void *m_buf, + void *r_1_buf, + void *n_buf, void *ni_buf, + void *msg_buf, + void *exp_buf, + void *mod_buf, + void *s_buf, + unsigned long *pks, unsigned long *n) { + + FILE * pk; + FILE * ms; + + pk = fopen("lib-gpu-generate/publickey.txt", "r"); + ms = fopen("lib-gpu-generate/msgsig.txt", "r"); + + fseek (ms, 0, SEEK_END); + long ms_l = ftell(ms); + fseek (ms, 0, SEEK_SET); + char *ms_ptr = malloc(ms_l); + char *ms_ptr_rest = malloc(ms_l); + if (ms_ptr || ms_ptr_rest) + { + fread (ms_ptr, 1, ms_l, ms); + memcpy(ms_ptr_rest, ms_ptr, ms_l); + } + fclose (ms); + + fseek (pk, 0, SEEK_END); + long pk_l = ftell(pk); + fseek (pk, 0, SEEK_SET); + char *pk_ptr = malloc(pk_l); + char *pk_ptr_rest = malloc(pk_l); + if (pk_ptr && pk_ptr_rest) + { + fread (pk_ptr, 1, pk_l, pk); + memcpy(pk_ptr_rest, pk_ptr, pk_l); + } + fclose (pk); + + gpu_register *x_buf_t = x_buf; + gpu_register *m_buf_t = m_buf; + gpu_register *r_1_buf_t = r_1_buf; + + gpu_register *ni_buf_t = ni_buf; + gpu_register *n_buf_t = n_buf; + gpu_register *msg_buf_t = msg_buf; + gpu_register *s_buf_t = s_buf; + gpu_register *mod_buf_t = mod_buf; + gpu_register *exp_buf_t = exp_buf; + + int len = (BIT_LENGTH / 8) / sizeof(gpu_register); + + char* message = strtok_r(ms_ptr, "\n", &ms_ptr_rest); + char* signature = strtok_r(0, "\n", &ms_ptr_rest); + char* modulus = strtok_r(pk_ptr, "\n", &pk_ptr_rest); + char* exponent = strtok_r(0, "\n", &pk_ptr_rest); + char* offs = strtok_r(0, "\n", &pk_ptr_rest); + + int i = 0; + int j = 0; + + mpz_t e,mod,msg,s; + + mpz_init(e); + mpz_init(mod); + mpz_init(msg); + mpz_init(s); + + mpz_t r, r_1, ni, M, x, N; + mpz_t NN; + + mpz_init(r); + mpz_init(r_1); + mpz_init(ni); + mpz_init(M); + mpz_init(x); + mpz_init(N); + mpz_init(NN); + + mpz_t one; // some helper variables + mpz_init_set_si(one,1); + + + // N is a constant for a given field (2048) + mpz_mul_2exp(N,one,2043); // r + mpz_mul_2exp(NN,one,44); // r + + mpz_add(N, N, NN); + mpz_add_ui(N, N, 1); // N = 2^2044 + 2^45 + 1 + + while (message != NULL && signature != NULL) { + + if (i == 0 || pks[j - 1] < i) { + + mpz_set_str(mod,modulus,16); + mpz_set_str(e,exponent,16); + + pks[j] = atoi(offs); + + modulus = strtok_r(0, "\n", &pk_ptr_rest); + exponent = strtok_r(0, "\n", &pk_ptr_rest); + offs = strtok_r(0, "\n", &pk_ptr_rest); + + // MARK: into montgomery domain + + + mpz_set_si(one, 1); + + + + mpz_mul_2exp(r,one,BIT_LENGTH); // r + + mpz_gcdext(one, r_1, ni, r, mod); // set r_1 and ni + + // MARK: n' is negative – fix that + + int sgn = mpz_sgn(r_1); + + mpz_abs(r_1, r_1); + mpz_abs(ni, ni); + + if (sgn == -1) { + mpz_sub(ni, r, ni); + mpz_sub(r_1, N, r_1); + } + + // MARK: export + + // exponent as is and mod -> n, ni -> ni, r_1 -> r_1 + + mpz_export(&n_buf_t[len * j], NULL, ORDER, sizeof(gpu_register), END, 0, mod); + mpz_export(&mod_buf_t[len * j], NULL, ORDER, sizeof(gpu_register), END, 0, mod); + mpz_export(&ni_buf_t[len * j], NULL, ORDER, sizeof(gpu_register), END, 0, ni); + mpz_export(&r_1_buf_t[len * j], NULL, ORDER, sizeof(gpu_register), END, 0, r_1); + mpz_export(&exp_buf_t[j], NULL, ORDER, sizeof(gpu_register), END, 0, e); + + j++; + + } + + mpz_set_str(msg,message,16); + mpz_set_str(s,signature,16); + + message = strtok_r(0, "\n",&ms_ptr_rest); + signature = strtok_r(0, "\n",&ms_ptr_rest); + + // set x (the number to 'square' (multiply by itself)) + mpz_mul(x, s, r); + mpz_mod(x, x, mod); + + // message as is and 'signature' -> x , M -> m + mpz_export(&msg_buf_t[len * i], NULL, ORDER, sizeof(gpu_register), END, 0, msg); + mpz_export(&s_buf_t[len * i], NULL, ORDER, sizeof(gpu_register), END, 0, s); + mpz_export(&x_buf_t[len * i], NULL, ORDER, sizeof(gpu_register), END, 0, s); + mpz_export(&m_buf_t[len * i], NULL, ORDER, sizeof(gpu_register), END, 0, s); + + + + + + i++; + } + + mpz_clear(e); + mpz_clear(mod); + mpz_clear(msg); + mpz_clear(s); + + mpz_clear(r); + mpz_clear(r_1); + mpz_clear(ni); + mpz_clear(M); + mpz_clear(x); + + mpz_clear(N); + mpz_clear(NN); + + mpz_clear(one); + + *n = i; + +} + + +int modmult_opencl_prepare(struct gpu_info *info, struct gpu_state_alt *state, + void *x_buf, void *m_buf, + //void *r_1_buf, + void *n_buf, void *ni_buf, + void *msg_buf, + void *exp_buf, + void *mod_buf, + void *s_buf, + unsigned long *pks, unsigned long n + ) { + + int err; // error code returned from api calls + + unsigned long pk = 0; + + while (1) { + if (pks[pk] + 1 >= n) + break; + pk++; + } + + unsigned long len = len_in_bytes; + + state->x_mem = clCreateBuffer(info->context, CL_MEM_READ_WRITE, len, NULL, NULL); + state->m_mem = clCreateBuffer(info->context, CL_MEM_READ_ONLY, len, NULL, NULL); + + //state->res_mem = clCreateBuffer(info->context, CL_MEM_READ_WRITE, len, NULL, NULL); // the result that is written back + state->n_mem = clCreateBuffer(info->context, CL_MEM_READ_ONLY, len, NULL, NULL); + state->ni_mem = clCreateBuffer(info->context, CL_MEM_READ_ONLY, len, NULL, NULL); + + state->exp_mem = clCreateBuffer(info->context, CL_MEM_READ_ONLY, n * sizeof(gpu_register), NULL, NULL); + + state->tmp_1 = clCreateBuffer(info->context, CL_MEM_READ_WRITE, len * 2, NULL, NULL); + state->tmp_2 = clCreateBuffer(info->context, CL_MEM_READ_WRITE, len * 2, NULL, NULL); + + state->pks_indices = clCreateBuffer(info->context, CL_MEM_READ_ONLY, sizeof(unsigned long) * (pk + 1),NULL, NULL); + + if (!state->x_mem || !state->m_mem || !state->n_mem || !state->ni_mem || !state->exp_mem || !state->tmp_1 || !state->tmp_2) + { + printf("Error: Failed to allocate device memory!\n"); + exit(1); + } + + void *tmp_1 = malloc(len * 2); + void *tmp_2 = malloc(len * 2); + + //void *res = malloc(len); + + memset(tmp_1, 0, len * 2); + memset(tmp_2, 0, len * 2); + //memset(res, 0, len); + + // Write our data set into the input array in device memory + // + err = clEnqueueWriteBuffer(info->commands, state->x_mem, CL_TRUE, 0, len, x_buf, 0, NULL, NULL); + err |= clEnqueueWriteBuffer(info->commands, state->m_mem, CL_TRUE, 0, len, m_buf, 0, NULL, NULL); + + //err |= clEnqueueWriteBuffer(info->commands, state->res_mem, CL_TRUE, 0, len, res, 0, NULL, NULL); + err |= clEnqueueWriteBuffer(info->commands, state->n_mem, CL_TRUE, 0, len, n_buf, 0, NULL, NULL); + err |= clEnqueueWriteBuffer(info->commands, state->ni_mem, CL_TRUE, 0, len, ni_buf, 0, NULL, NULL); + + err |= clEnqueueWriteBuffer(info->commands, state->exp_mem, CL_TRUE, 0, n * sizeof(gpu_register), exp_buf, 0, NULL, NULL); + + err |= clEnqueueWriteBuffer(info->commands, state->tmp_1, CL_TRUE, 0, len * 2, tmp_1, 0, NULL, NULL); + err |= clEnqueueWriteBuffer(info->commands, state->tmp_2, CL_TRUE, 0, len * 2, tmp_2, 0, NULL, NULL); + + err |= clEnqueueWriteBuffer(info->commands, state->pks_indices, CL_TRUE, 0, sizeof(unsigned long) * (pk + 1), pks, 0, NULL, NULL); + if (err != CL_SUCCESS) + { + printf("Error: Failed to write to source array!\n"); + exit(1); + } + + free(tmp_1); + free(tmp_2); + //free(res); + + // Set the arguments to our compute kernel + // + err = 0; + err = clSetKernelArg(info->kernel, 0, sizeof(cl_mem), &state->x_mem); + err |= clSetKernelArg(info->kernel, 1, sizeof(cl_mem), &state->m_mem); + //err |= clSetKernelArg(info->kernel, 2, sizeof(cl_mem), &state->res_mem); + err |= clSetKernelArg(info->kernel, 3, sizeof(cl_mem), &state->n_mem); + err |= clSetKernelArg(info->kernel, 4, sizeof(cl_mem), &state->ni_mem); + err |= clSetKernelArg(info->kernel, 5, sizeof(cl_mem), &state->exp_mem); + err |= clSetKernelArg(info->kernel, 6, sizeof(cl_mem), &state->tmp_1); + err |= clSetKernelArg(info->kernel, 7, sizeof(cl_mem), &state->tmp_2); + err |= clSetKernelArg(info->kernel, 8, sizeof(cl_mem), &state->pks_indices); + //err |= clSetKernelArg(info->kernel, 9, sizeof(unsigned long), &n); + + + if (err != CL_SUCCESS) + { + printf("RSA-Error: Failed to set kernel arguments! %d\n", err); + exit(1); + } + + state->total = n; + + + return 0; + +} + +int modmult_opencl_exec_kernel(struct gpu_info *info, struct gpu_state_alt *state) { + + size_t global; + // size_t local; + int err; + + // MARK: deal with size limitations + + size_t modifier = (BIT_LENGTH / 8) / sizeof(gpu_register); + + // MARK: testing with one kernel, and a loop that simulates work items + + //global = state->total % len == 0? state->total : state->total + state->total % len; + global = state->total; // has to be exactly the amount of signatures we want to verify + + // measure from the first call to the kernel... + if (state->skip) { + state->skip = false; + clock_gettime(CLOCK_REALTIME, &state->t1); + } + + err = clEnqueueNDRangeKernel(info->commands, info->kernel, 1, NULL, &global, NULL, 0, NULL, NULL); + if (err) + { + printf("Error: Failed to execute kernel!\n"); + return EXIT_FAILURE; + } + + printf("KERNEL IS EXECUTING...\n"); + + return 0; + +} + +unsigned long modmult_opencl_results(struct gpu_info *info, struct gpu_state_alt *state, bool timed, void * msg_buf, void * r_1_buf, void * n_buf, void* s_buf, void *mod_buf, unsigned long n) { + + if (state->skip) { + // reset skip in the kernel execution + return 0; + } + + int err; + + // Wait for the command commands to get serviced before reading back results + // + err = clFinish(info->commands); + if (err != CL_SUCCESS) + { + printf("Error: Kernel failure! %d\n", err); + exit(1); + } + + + + void *results = malloc(len_in_bytes); + memset(results, 0, len_in_bytes); + + + // Read back the results from the device to verify the output + err = clEnqueueReadBuffer(info->commands, state->res_mem, CL_TRUE, 0, len_in_bytes, results, 0, NULL, NULL ); + if (err != CL_SUCCESS) + { + printf("Error: Failed to read output array! %d\n", err); + exit(1); + } + + // MARK: convert out of montgomery + + mpz_t ret,a,r_1,mod,N; + + mpz_init(ret); + mpz_init(a); + mpz_init(r_1); + mpz_init(mod); + mpz_init(N); + + //mpz_export(&n_buf_t[len * j], NULL, 1, sizeof(gpu_register), 0, 0, mod); + + int len = (BIT_LENGTH / 8) / sizeof(gpu_register); + + for (int i = 0; i < n; i++) { + + mpz_import(a, len, ORDER, sizeof(gpu_register), END, 0, &results[i * len]); + mpz_import(r_1, len, ORDER, sizeof(gpu_register), END, 0, &r_1_buf[i * len]); + mpz_import(N, len, ORDER, sizeof(gpu_register), END, 0, &n_buf[i * len]); + mpz_import(mod, len, ORDER, sizeof(gpu_register), END, 0, &mod_buf[i * len]); + + // mpz_mul(ret, a, r_1); + // mpz_mod(ret, ret, mod); + + } + + gmp_printf ("ret in decimal: %Zd\n", a); + + // test reference + + mpz_t sig, sig_tmp, one, r; + mpz_init(sig); + mpz_init(sig_tmp); + + mpz_init(one); + mpz_init(r); + + mpz_import(sig, len, ORDER, sizeof(gpu_register), END, 0, s_buf); + + mpz_set_si(one, 1); + mpz_mul_2exp(r,one,BIT_LENGTH); // r + + mpz_mul(sig, sig, sig); + mpz_mod(sig, sig, r); + + gmp_printf ("ref: %Zd\n", sig); + + + printf(""); + + mpz_clear(ret); + mpz_clear(a); + mpz_clear(r_1); + mpz_clear(mod); + + mpz_clear(one); + + + + + + + + + if (timed) { + // stop measuring after the last command has been read + clock_gettime(CLOCK_REALTIME, &state->t2); + + printf("GPU verification took %ld.%06ld s\n", ( state->t2.tv_nsec < state->t1.tv_nsec ? state->t2.tv_sec - (state->t1.tv_sec + 1) : state->t2.tv_sec - state->t1.tv_sec ), ( state->t2.tv_nsec < state->t1.tv_nsec ? ((999999999 - state->t1.tv_nsec) + state->t2.tv_nsec) : (state->t2.tv_nsec - state->t1.tv_nsec) ) / 1000); + + } + + + return 0; + +} + +void modmult_opencl_cleanup(struct gpu_info *info) { + + clReleaseProgram(info->program); + clReleaseKernel(info->kernel); + clReleaseCommandQueue(info->commands); + clReleaseContext(info->context); + +} + +void modmult_opencl_release(struct gpu_state_alt *state) { + + clReleaseMemObject(state->x_mem); + clReleaseMemObject(state->m_mem); + //clReleaseMemObject(state->res_mem); + clReleaseMemObject(state->n_mem); + clReleaseMemObject(state->ni_mem); + clReleaseMemObject(state->exp_mem); + + clReleaseMemObject(state->tmp_1); + clReleaseMemObject(state->tmp_2); + + clReleaseMemObject(state->pks_indices); +} + +// MARK: for library + +void modmult_gpu_init(struct gpu_info *info, struct gpu_state_alt *state) { + + info->platform = select_platform(0, false); + info->device_id = select_device (info->platform); + info->context = create_compute_context (info->device_id); + info->commands = create_command_queue (info->device_id, info->context); + info->program = compile_program (info->device_id, info->context, "montmodmult.cl"); + info->kernel = create_kernel (info->program, "mont"); + + state->result = 0; + state->total = 0; + state->skip = true; + + int err = 0; + + void *results = malloc(len_in_bytes); + memset(results, 0, len_in_bytes); + + state->res_mem = clCreateBuffer(info->context, CL_MEM_READ_WRITE, len_in_bytes ,NULL, NULL); + + err |= clEnqueueWriteBuffer(info->commands, state->res_mem, CL_TRUE, 0, len_in_bytes, results, 0, NULL, NULL); + if (err != CL_SUCCESS) + { + printf("Error: Failed to write to source array!\n"); + exit(1); + } + + err |= clSetKernelArg(info->kernel, 2, sizeof(cl_mem), &state->res_mem); + if (err != CL_SUCCESS) + { + printf("Error: Failed to set kernel arguments! %d\n", err); + exit(1); + } +} + +void modmult_gpu_execute(struct gpu_info *info, struct gpu_state_alt *state, + void *x_buf, void *m_buf, + void *r_1_buf, + void *n_buf, void *ni_buf, + void *msg_buf, + void *exp_buf, + void *mod_buf, + void *s_buf, + unsigned long *pks, unsigned long n) { + + modmult_opencl_prepare(info, state, + x_buf, m_buf, + //r_1_buf, + n_buf, ni_buf, + msg_buf, exp_buf, mod_buf, s_buf, + pks, n + ); // prepares the next batch of signatures on CPU, naturally blocks until it's finished + + state->result += modmult_opencl_results(info, state, false, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n); // waits for kernel, if it is not ready yet + modmult_opencl_exec_kernel(info,state); // start kernel (returns immediately) + modmult_opencl_release(state); // release buffers + + + +} + +unsigned long modmult_gpu_finish(struct gpu_info *info, struct gpu_state_alt *state, void * msg_buf, void * r_1_buf, void * n_buf, void *mod_buf, void* s_buf, unsigned long n) { + + state->result += modmult_opencl_results(info,state,true,msg_buf,r_1_buf,n_buf, s_buf, mod_buf, n); + + modmult_opencl_cleanup(info); + //clReleaseMemObject(state->invalid); + + unsigned long res = state->result; + + state->result = 0; // reset result + + return res; + +} + + +int mont_modmult_tests(void) { + + unsigned long pairs = number_of_pairs(); // returns an estimation of pairs + + unsigned long digit_sz = (BIT_LENGTH / 8) * pairs; + + len_in_bytes = digit_sz; + + unsigned long arr_sz = pairs * sizeof(unsigned long); + + gpu_register *x_buf = malloc(digit_sz); + gpu_register *m_buf = malloc(digit_sz); + gpu_register *r_1_buf = malloc(digit_sz); + gpu_register *n_buf = malloc(digit_sz); + gpu_register *ni_buf = malloc(digit_sz); + gpu_register *msg_buf = malloc(digit_sz); + gpu_register *s_buf = malloc(digit_sz); + gpu_register *mod_buf = malloc(digit_sz); + gpu_register *exp_buf = malloc(pairs * sizeof(gpu_register)); + + memset(x_buf, 0, digit_sz); + memset(m_buf, 0, digit_sz); + memset(r_1_buf, 0, digit_sz); + memset(n_buf, 0, digit_sz); + memset(ni_buf, 0, digit_sz); + memset(msg_buf, 0, digit_sz); + memset(s_buf, 0, digit_sz); + memset(mod_buf, 0, digit_sz); + memset(exp_buf, 0, digit_sz * sizeof(gpu_register)); + + unsigned long *pks = malloc(arr_sz); + + memset(pks, 0, arr_sz); + + printf("READING KEYS...\n"); + + montmodmult_pairs_from_files(x_buf, m_buf, + r_1_buf, + n_buf, ni_buf, + msg_buf, exp_buf, mod_buf, s_buf, + pks, &pairs); + + printf("VERIFYING %lu SIGNATURES...\n", pairs); + + struct gpu_info info; + struct gpu_state_alt state; + + modmult_gpu_init(&info, &state); + + modmult_gpu_execute(&info, &state, + x_buf, m_buf, + r_1_buf, + n_buf, ni_buf, + msg_buf, exp_buf, mod_buf, s_buf, + pks, pairs); + + unsigned long res = modmult_gpu_finish(&info, &state, msg_buf, r_1_buf, n_buf, mod_buf,s_buf, pairs); + + if (res == pairs) { + printf("VERIFICATION RESULT: %lu - OK\n\n",res); + } else { + printf("VERIFICATION RESULT: %lu - NOT OK\n\n",res); + } + + + + printf(""); + +} diff --git a/source/montmodmult.h b/source/montmodmult.h @@ -9,5 +9,12 @@ #define montmodmult_h #include <stdio.h> +#include "ctype.h" +#include <gmp.h> + +int mont_modmult_tests(void); + + +typedef u_int64_t gpu_register; #endif /* montmodmult_h */ diff --git a/source/rsa-test.c b/source/rsa-test.c @@ -335,7 +335,7 @@ int opencl_prepare(struct gpu_info *info, struct gpu_state *state, err |= clSetKernelArg(info->kernel, 5, sizeof(cl_mem), &state->mod_len); err |= clSetKernelArg(info->kernel, 6, sizeof(cl_mem), &state->comp_mem); err |= clSetKernelArg(info->kernel, 7, sizeof(cl_mem), &state->comp_len); - //err |= clSetKernelArg(info->kernel, 8, sizeof(cl_mem), &state->valid); + //err |= clSetKernelArg(info->kernel, 8, sizeof(cl_mem), &state->valid); -> set somewhere else err |= clSetKernelArg(info->kernel, 9, sizeof(cl_mem), &state->pks_indices); err |= clSetKernelArg(info->kernel, 10, sizeof(unsigned long), &n); diff --git a/source/rsa-test.h b/source/rsa-test.h @@ -12,41 +12,6 @@ #include "ctype.h" -struct gpu_info { - - cl_platform_id platform; - cl_device_id device_id; - cl_context context; - cl_command_queue commands; - cl_program program; - cl_kernel kernel; - -}; - -struct gpu_state { - - cl_mem invalid; - - cl_mem sig_mem; - cl_mem exp_mem; - cl_mem mod_mem; - cl_mem comp_mem; - - cl_mem sig_len; - cl_mem exp_len; - cl_mem mod_len; - cl_mem comp_len; - - cl_mem pks_indices; - - struct timespec t1, t2; - - unsigned long total; // 0 - unsigned long result; // 0 - - bool skip; - -}; int rsa_tests(void); diff --git a/source/util.h b/source/util.h @@ -66,4 +66,66 @@ create_kernel (cl_program program, const char *name); +struct gpu_info { + + cl_platform_id platform; + cl_device_id device_id; + cl_context context; + cl_command_queue commands; + cl_program program; + cl_kernel kernel; + +}; + +struct gpu_state { + + cl_mem invalid; + + cl_mem sig_mem; + cl_mem exp_mem; + cl_mem mod_mem; + cl_mem comp_mem; + + cl_mem sig_len; + cl_mem exp_len; + cl_mem mod_len; + cl_mem comp_len; + + cl_mem pks_indices; + + struct timespec t1, t2; + + unsigned long total; // 0 + unsigned long result; // 0 + + bool skip; + +}; + +struct gpu_state_alt { + + // cl_mem invalid; + + cl_mem x_mem; + cl_mem m_mem; + cl_mem res_mem; + cl_mem n_mem; + cl_mem ni_mem; + //cl_mem msg_mem; + cl_mem exp_mem; + + cl_mem tmp_1; + cl_mem tmp_2; + + cl_mem pks_indices; + + struct timespec t1, t2; + + unsigned long total; // 0 + unsigned long result; // 0 + + bool skip; + +}; + #endif /* util_h */ diff --git a/xcode/.DS_Store b/xcode/.DS_Store Binary files differ. diff --git a/xcode/lib-gpu-generate/msgsig.txt b/xcode/lib-gpu-generate/msgsig.txt @@ -1,2 +1,2 @@ -3DB82611F0AA4549 -0083ECD7379021AE99FFCF028CC1EBF96542B931D8C3F245EF64FE7423238D90D423C1F33E1D6CA24C0ADB8302D18A98DAAB565E49E81ED08937D3C7B7AF4AA1F832397EC0EFF11118AA159AF722B030EA5F614CE458DE575A4DEC70A94539B789E60F5B6CF0F146B1FB01C5F0583571BB21592E08E195488FE83AB18E40003A7285DA710157FFB64D577051B3BD88BA0B867CA402F910BDF35440F7A83024E4A261AD6E79E3B3312C0BDB23EEA6DBFA6A81CFB2635AE801815B24EED2E08A0CA4877037776CF0FB5079BF12CE721DBBB66DE87C5ACB24E01AC751E5853AEEE6BEA1CC60E1A68836108EA11B79BC4FEB2F2F47591C1A2E552C74BAA714382610EC +9506E0DF73 +7134105D4E8706C01F2EDE5C773E2A250A269D2DA99BAB49AC8D5FF9AEA2E059D4D66F514452DEA37AB39E2D5B65281CB6566850548E5DCA87ABD5FC171D56BD1DB449A257D1CA2ECBA66C8232B4A2F1E590427CA3E451188A036A49346D8AFFA48A4F90DA6D26B22CECEE53FD8951CA101D937598C292B380CE836C8B6D992ABE0DC5AD4240C9E01BD441F359374C15A0D30BC296F56C79D85157AC00B339A8C4B2414300A131B023ED30EDFFD9CFA6FEBCBC724D5C88C3FC89815654526D28D41871AC7FC4514F4FCC6789404A3F13661A3DA4B311AB6AF547673D5FD13E544377A8960E6360E76DEF3788BD3356720EF514DCD2BBD1C4950385A2104BA984 diff --git a/xcode/lib-gpu-generate/publickey.txt b/xcode/lib-gpu-generate/publickey.txt @@ -1,3 +1,3 @@ -00AACCE8836848B3FE12D67F155B2EF70734C8D6E374C78300167C5F3062CC76D43F0E74281142784343BE313261A50B4B23CBC45D5F8BF88025C07BD4F02FC557E370A47775820307845F179F49592EC466C6FC33A59F9E05B1B70BCC1F5F62431B5BFF0F02377A1C94E4B8E92C249402B74EAD7CAF30D4DA2144B9B1357A7A9944540E1A1D1805E767C693B0D3D3267072DCF51AE61A0AB08E453095C3A623DD50C727EF2F74788DAE6E73613F5D7329E68B9BB3BBE770E1093FCE9A43B32DFC2975B648D9A2A89A0FED9DB41C7898FA3AEFC35602A8A96C1E84C9766C06E1F58641010EF8FCB7B93709795678988A9EDA6191D43E927D13AED334B964D05F3B -010001 +00CA5F6FD970F17AAEA1F2272368C1CE27E2252F7357C651AAC203EA012D888CED38F4F1B97DB332E005E291D845DECBD3846A3E09F0FEBCDC71D31A735874F9848974814474055FA200F6D42B715AFD9E04C4DA1FF2457020EEB4753E44318AF4E41111923B007FCBB1E2E17898E00AD500BFF849E7360B0249DA98A3D7301E12C6A2C33925078E783336263AC07A3EED6594414736E01DFA621CBB93E1C548E539AF8D0FB87AE0F8181B9C38046E01508F2865333305BDC8C177F3D7A1CF677F11F6115D45792AFF2BAFFB36CC700757AC262C29F76D0869DF5B6258D754237DBE492236251599D3ACB500F0764021881BD1F1777143F6D73B63D7B9AD67CB2B +02 0 diff --git a/xcode/lib-gpu-verify.xcodeproj/project.pbxproj b/xcode/lib-gpu-verify.xcodeproj/project.pbxproj @@ -9,11 +9,12 @@ /* Begin PBXBuildFile section */ 6A36F8892B0F938E00AB772D /* montgomery.cl in Sources */ = {isa = PBXBuildFile; fileRef = 6A36F8882B0F938E00AB772D /* montgomery.cl */; }; 6A8A795F2A89672700116D7D /* verify.cl in Sources */ = {isa = PBXBuildFile; fileRef = 6A8A795E2A89672700116D7D /* verify.cl */; }; - 6A99B06E2B1293DA0004E4B7 /* gmp.c in Sources */ = {isa = PBXBuildFile; fileRef = 6A7914CB2B0CF320001EDCC1 /* gmp.c */; }; 6AA38E5B2B0A97FC00E85243 /* main.c in Sources */ = {isa = PBXBuildFile; fileRef = 6AA38E5A2B0A97FC00E85243 /* main.c */; }; 6AB4D99D2B1645F900A686F2 /* montgomery-test.c in Sources */ = {isa = PBXBuildFile; fileRef = 6AB4D99C2B1645F900A686F2 /* montgomery-test.c */; }; 6ABC2E842B231DFF00033B90 /* util.c in Sources */ = {isa = PBXBuildFile; fileRef = 6ABC2E832B231DFF00033B90 /* util.c */; }; 6ABC2E882B231E3D00033B90 /* reference-test.c in Sources */ = {isa = PBXBuildFile; fileRef = 6ABC2E862B231E3D00033B90 /* reference-test.c */; }; + 6AC553252B2E174900046AB7 /* montmodmult.cl in Sources */ = {isa = PBXBuildFile; fileRef = 6AC553242B2E174900046AB7 /* montmodmult.cl */; }; + 6AC553292B2E17C800046AB7 /* montmodmult.c in Sources */ = {isa = PBXBuildFile; fileRef = 6AC553282B2E17C800046AB7 /* montmodmult.c */; }; 6AF7487A2ADADEBD00D58E08 /* lib-gpu-verify.c in Sources */ = {isa = PBXBuildFile; fileRef = 6AF748792ADADEBD00D58E08 /* lib-gpu-verify.c */; }; 6AF748832ADADF4500D58E08 /* rsa-test.c in Sources */ = {isa = PBXBuildFile; fileRef = 6AF7487F2ADADF4500D58E08 /* rsa-test.c */; }; C3770EFD0E6F1138009A5A77 /* OpenCL.framework in Frameworks */ = {isa = PBXBuildFile; fileRef = C3770EFC0E6F1138009A5A77 /* OpenCL.framework */; }; @@ -43,10 +44,8 @@ /* Begin PBXFileReference section */ 466E0F5F0C932E1A00ED01DB /* lib-gpu-verify */ = {isa = PBXFileReference; explicitFileType = "compiled.mach-o.executable"; includeInIndex = 0; path = "lib-gpu-verify"; sourceTree = BUILT_PRODUCTS_DIR; }; 6A36F8882B0F938E00AB772D /* montgomery.cl */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.opencl; path = montgomery.cl; sourceTree = "<group>"; }; - 6A7914CB2B0CF320001EDCC1 /* gmp.c */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.c; name = gmp.c; path = ../source/gmp.c; sourceTree = "<group>"; }; 6A7914CC2B0CF320001EDCC1 /* montgomery.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; name = montgomery.h; path = ../source/montgomery.h; sourceTree = "<group>"; }; 6A7914CD2B0CF320001EDCC1 /* montgomery.c */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.c; name = montgomery.c; path = ../source/montgomery.c; sourceTree = "<group>"; }; - 6A7914CE2B0CF320001EDCC1 /* gmp.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; name = gmp.h; path = ../source/gmp.h; sourceTree = "<group>"; }; 6A8A795E2A89672700116D7D /* verify.cl */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.opencl; path = verify.cl; sourceTree = "<group>"; }; 6AA38E582B0A97FC00E85243 /* lib-gpu-generate */ = {isa = PBXFileReference; explicitFileType = "compiled.mach-o.executable"; includeInIndex = 0; path = "lib-gpu-generate"; sourceTree = BUILT_PRODUCTS_DIR; }; 6AA38E5A2B0A97FC00E85243 /* main.c */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.c.c; path = main.c; sourceTree = "<group>"; }; @@ -57,6 +56,11 @@ 6ABC2E852B231E0400033B90 /* util.h */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.c.h; name = util.h; path = ../source/util.h; sourceTree = "<group>"; }; 6ABC2E862B231E3D00033B90 /* reference-test.c */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.c; name = "reference-test.c"; path = "../source/reference-test.c"; sourceTree = "<group>"; }; 6ABC2E872B231E3D00033B90 /* reference-test.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; name = "reference-test.h"; path = "../source/reference-test.h"; sourceTree = "<group>"; }; + 6AC553242B2E174900046AB7 /* montmodmult.cl */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.opencl; path = montmodmult.cl; sourceTree = "<group>"; }; + 6AC553272B2E17C800046AB7 /* montmodmult.h */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.c.h; name = montmodmult.h; path = ../source/montmodmult.h; sourceTree = "<group>"; }; + 6AC553282B2E17C800046AB7 /* montmodmult.c */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.c.c; name = montmodmult.c; path = ../source/montmodmult.c; sourceTree = "<group>"; }; + 6AC5532A2B2E885200046AB7 /* gmp.c */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.c; name = gmp.c; path = ../source/gmp.c; sourceTree = "<group>"; }; + 6AC5532C2B2E889100046AB7 /* gmp.h */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.c.h; name = gmp.h; path = ../source/gmp.h; sourceTree = "<group>"; }; 6AF748792ADADEBD00D58E08 /* lib-gpu-verify.c */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.c; name = "lib-gpu-verify.c"; path = "../source/lib-gpu-verify.c"; sourceTree = "<group>"; }; 6AF7487F2ADADF4500D58E08 /* rsa-test.c */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.c; name = "rsa-test.c"; path = "../source/rsa-test.c"; sourceTree = "<group>"; }; 6AF748802ADADF4500D58E08 /* rsa-test.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; name = "rsa-test.h"; path = "../source/rsa-test.h"; sourceTree = "<group>"; }; @@ -105,8 +109,8 @@ isa = PBXGroup; children = ( 6AF748802ADADF4500D58E08 /* rsa-test.h */, - 6A7914CE2B0CF320001EDCC1 /* gmp.h */, 6A7914CC2B0CF320001EDCC1 /* montgomery.h */, + 6AC5532C2B2E889100046AB7 /* gmp.h */, 6ABC2E852B231E0400033B90 /* util.h */, 6ABC2E872B231E3D00033B90 /* reference-test.h */, 6AB4D99B2B1645F900A686F2 /* montgomery-test.h */, @@ -123,6 +127,16 @@ path = "lib-gpu-generate"; sourceTree = "<group>"; }; + 6AC553262B2E175500046AB7 /* pingpong */ = { + isa = PBXGroup; + children = ( + 6AC553242B2E174900046AB7 /* montmodmult.cl */, + 6AC553272B2E17C800046AB7 /* montmodmult.h */, + 6AC553282B2E17C800046AB7 /* montmodmult.c */, + ); + name = pingpong; + sourceTree = "<group>"; + }; C3770EF10E6F10BB009A5A77 /* Sources */ = { isa = PBXGroup; children = ( @@ -131,11 +145,12 @@ 6A36F8882B0F938E00AB772D /* montgomery.cl */, 6AF748792ADADEBD00D58E08 /* lib-gpu-verify.c */, 6AF7487F2ADADF4500D58E08 /* rsa-test.c */, - 6A7914CB2B0CF320001EDCC1 /* gmp.c */, + 6AC5532A2B2E885200046AB7 /* gmp.c */, 6A7914CD2B0CF320001EDCC1 /* montgomery.c */, 6AB4D99C2B1645F900A686F2 /* montgomery-test.c */, 6ABC2E832B231DFF00033B90 /* util.c */, 6ABC2E862B231E3D00033B90 /* reference-test.c */, + 6AC553262B2E175500046AB7 /* pingpong */, ); name = Sources; sourceTree = "<group>"; @@ -227,7 +242,8 @@ files = ( 6AB4D99D2B1645F900A686F2 /* montgomery-test.c in Sources */, 6ABC2E882B231E3D00033B90 /* reference-test.c in Sources */, - 6A99B06E2B1293DA0004E4B7 /* gmp.c in Sources */, + 6AC553252B2E174900046AB7 /* montmodmult.cl in Sources */, + 6AC553292B2E17C800046AB7 /* montmodmult.c in Sources */, 6AF7487A2ADADEBD00D58E08 /* lib-gpu-verify.c in Sources */, 6A8A795F2A89672700116D7D /* verify.cl in Sources */, 6ABC2E842B231DFF00033B90 /* util.c in Sources */, @@ -345,7 +361,10 @@ ); LIBRARY_SEARCH_PATHS_QUOTED_FOR_TARGET_1 = "\"$(SRCROOT)/../lib\" \"/usr/local/lib\""; MACOSX_DEPLOYMENT_TARGET = 13.5; - OTHER_LDFLAGS = "-lgcrypt"; + OTHER_LDFLAGS = ( + "-lgcrypt", + "-lgmp", + ); PRODUCT_NAME = "lib-gpu-verify"; SYSTEM_FRAMEWORK_SEARCH_PATHS = ""; USE_HEADERMAP = NO; @@ -372,7 +391,10 @@ ); LIBRARY_SEARCH_PATHS_QUOTED_FOR_TARGET_1 = "\"$(SRCROOT)/../lib\" \"/usr/local/lib\""; MACOSX_DEPLOYMENT_TARGET = 13.5; - OTHER_LDFLAGS = "-lgcrypt"; + OTHER_LDFLAGS = ( + "-lgcrypt", + "-lgmp", + ); PRODUCT_NAME = "lib-gpu-verify"; USE_HEADERMAP = NO; ZERO_LINK = NO; diff --git a/xcode/lib-gpu-verify.xcodeproj/project.xcworkspace/xcuserdata/cedriczwahlen.xcuserdatad/UserInterfaceState.xcuserstate b/xcode/lib-gpu-verify.xcodeproj/project.xcworkspace/xcuserdata/cedriczwahlen.xcuserdatad/UserInterfaceState.xcuserstate Binary files differ. diff --git a/xcode/lib-gpu-verify.xcodeproj/xcuserdata/cedriczwahlen.xcuserdatad/xcdebugger/Breakpoints_v2.xcbkptlist b/xcode/lib-gpu-verify.xcodeproj/xcuserdata/cedriczwahlen.xcuserdatad/xcdebugger/Breakpoints_v2.xcbkptlist @@ -4030,5 +4030,1506 @@ landmarkType = "9"> </BreakpointContent> </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "B5F8D09B-DBD6-4D27-9F18-0AA02E970656" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "21" + endingLineNumber = "21" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "3947C3E7-D4B7-443E-9C64-26FA73518839" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "115" + endingLineNumber = "115" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "3947C3E7-D4B7-443E-9C64-26FA73518839 - 18037aea005af134" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "92" + endingLineNumber = "92" + offsetFromSymbolStart = "928"> + </Location> + <Location + uuid = "3947C3E7-D4B7-443E-9C64-26FA73518839 - 18037aea005af115" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "91" + endingLineNumber = "91" + offsetFromSymbolStart = "1023"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "700C8EE6-BC1E-427F-B1C6-E018D10BDEC8" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "558" + endingLineNumber = "558" + landmarkName = "mont_modmult_tests()" + landmarkType = "9"> + <Locations> + <Location + uuid = "700C8EE6-BC1E-427F-B1C6-E018D10BDEC8 - 3a6dd6ae57b14a5e" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "462" + endingLineNumber = "462" + offsetFromSymbolStart = "23"> + </Location> + <Location + uuid = "700C8EE6-BC1E-427F-B1C6-E018D10BDEC8 - 3a6dd6ae57b14a5e" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "462" + endingLineNumber = "462" + offsetFromSymbolStart = "14"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "DB1A1F80-9BCD-4641-8418-19BE4BCBC405" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "100" + endingLineNumber = "100" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "605" + endingLineNumber = "605" + landmarkName = "mont_modmult_tests()" + landmarkType = "9"> + <Locations> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b149b8" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "492" + endingLineNumber = "492" + offsetFromSymbolStart = "437"> + </Location> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b149b8" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "492" + endingLineNumber = "492" + offsetFromSymbolStart = "473"> + </Location> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b14e3c" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "496" + endingLineNumber = "496" + offsetFromSymbolStart = "473"> + </Location> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b151d5" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "551" + endingLineNumber = "551" + offsetFromSymbolStart = "488"> + </Location> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b15742" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "562" + endingLineNumber = "562" + offsetFromSymbolStart = "488"> + </Location> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b15742" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "562" + endingLineNumber = "562" + offsetFromSymbolStart = "538"> + </Location> + <Location + uuid = "D2BA3F25-8290-42F4-8C03-1F8F1A3C497D - 3a6dd6ae57b15b85" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "mont_modmult_tests" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "599" + endingLineNumber = "599" + offsetFromSymbolStart = "538"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "877D065B-1222-4A88-A7A1-36AA5BAAA34B" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "226" + endingLineNumber = "226" + landmarkName = "modmult_opencl_prepare(info, state, x_buf, m_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "877D065B-1222-4A88-A7A1-36AA5BAAA34B - 7ea67c6850ea9357" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_prepare" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "194" + endingLineNumber = "194" + offsetFromSymbolStart = "108"> + </Location> + <Location + uuid = "877D065B-1222-4A88-A7A1-36AA5BAAA34B - 7ea67c6850ea90f0" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_prepare" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "199" + endingLineNumber = "199" + offsetFromSymbolStart = "104"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "0919DE7F-CA68-40D2-98C2-CDC334661F60" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "216" + endingLineNumber = "216" + landmarkName = "modmult_opencl_prepare(info, state, x_buf, m_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "4B27D588-7D34-4BD1-A24D-4C6E8D39B984" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "440" + endingLineNumber = "440" + landmarkName = "modmult_opencl_results(info, state, timed, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "4B27D588-7D34-4BD1-A24D-4C6E8D39B984 - b46ebf1cc4a0b9c0" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "346" + endingLineNumber = "346" + offsetFromSymbolStart = "269"> + </Location> + <Location + uuid = "4B27D588-7D34-4BD1-A24D-4C6E8D39B984 - b46ebf1cc4a0b9c0" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "346" + endingLineNumber = "346" + offsetFromSymbolStart = "259"> + </Location> + <Location + uuid = "4B27D588-7D34-4BD1-A24D-4C6E8D39B984 - b46ebf1cc4a0b9c0" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "346" + endingLineNumber = "346" + offsetFromSymbolStart = "256"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "800CDD46-DF8C-4E7E-A8E0-2BC47B0E60D2" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "228" + endingLineNumber = "228" + landmarkName = "modmult_opencl_prepare(info, state, x_buf, m_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "800CDD46-DF8C-4E7E-A8E0-2BC47B0E60D2 - 7ea67c6850ea90d3" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_prepare" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "198" + endingLineNumber = "198" + offsetFromSymbolStart = "119"> + </Location> + <Location + uuid = "800CDD46-DF8C-4E7E-A8E0-2BC47B0E60D2 - 7ea67c6850ea90be" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_prepare" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "201" + endingLineNumber = "201" + offsetFromSymbolStart = "116"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "388" + endingLineNumber = "388" + landmarkName = "modmult_opencl_results(info, state, timed, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0ba5c" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "358" + endingLineNumber = "358" + offsetFromSymbolStart = "361"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0ba7d" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "357" + endingLineNumber = "357" + offsetFromSymbolStart = "351"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0ba3f" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "359" + endingLineNumber = "359" + offsetFromSymbolStart = "351"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0ba5c" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "358" + endingLineNumber = "358" + offsetFromSymbolStart = "351"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0ba1e" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "360" + endingLineNumber = "360" + offsetFromSymbolStart = "351"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0bbd0" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "362" + endingLineNumber = "362" + offsetFromSymbolStart = "351"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0bb75" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "365" + endingLineNumber = "365" + offsetFromSymbolStart = "351"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a041ce" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "408" + endingLineNumber = "408" + offsetFromSymbolStart = "369"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0be9b" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "387" + endingLineNumber = "387" + offsetFromSymbolStart = "394"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0bd45" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "381" + endingLineNumber = "381" + offsetFromSymbolStart = "370"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0bed9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "385" + endingLineNumber = "385" + offsetFromSymbolStart = "370"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0bed9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "385" + endingLineNumber = "385" + offsetFromSymbolStart = "374"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0bed9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "385" + endingLineNumber = "385" + offsetFromSymbolStart = "398"> + </Location> + <Location + uuid = "84A684AB-D668-4B78-9FD1-2540A08574E3 - b46ebf1cc4a0be7a" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "388" + endingLineNumber = "388" + offsetFromSymbolStart = "398"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "FAC6BA4D-8703-4276-BEAA-7EA43AF63D0F" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "326" + endingLineNumber = "326" + landmarkName = "modmult_opencl_exec_kernel(info, state)" + landmarkType = "9"> + <Locations> + <Location + uuid = "FAC6BA4D-8703-4276-BEAA-7EA43AF63D0F - 22ed8a6bec85ee99" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "298" + endingLineNumber = "298" + offsetFromSymbolStart = "28"> + </Location> + <Location + uuid = "FAC6BA4D-8703-4276-BEAA-7EA43AF63D0F - 22ed8a6bec85ee99" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "298" + endingLineNumber = "298" + offsetFromSymbolStart = "32"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "5B1B4488-A19F-4A97-926D-1263BFEFF802" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "323" + endingLineNumber = "323" + landmarkName = "modmult_opencl_exec_kernel(info, state)" + landmarkType = "9"> + <Locations> + <Location + uuid = "5B1B4488-A19F-4A97-926D-1263BFEFF802 - 22ed8a6bec85ee15" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "294" + endingLineNumber = "294" + offsetFromSymbolStart = "24"> + </Location> + <Location + uuid = "5B1B4488-A19F-4A97-926D-1263BFEFF802 - 22ed8a6bec85eed7" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "296" + endingLineNumber = "296" + offsetFromSymbolStart = "24"> + </Location> + <Location + uuid = "5B1B4488-A19F-4A97-926D-1263BFEFF802 - 22ed8a6bec85e8c6" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "311" + endingLineNumber = "311" + offsetFromSymbolStart = "24"> + </Location> + <Location + uuid = "5B1B4488-A19F-4A97-926D-1263BFEFF802 - 22ed8a6bec85e487" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "344" + endingLineNumber = "344" + offsetFromSymbolStart = "24"> + </Location> + <Location + uuid = "5B1B4488-A19F-4A97-926D-1263BFEFF802 - 22ed8a6bec85ea71" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_exec_kernel" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "322" + endingLineNumber = "322" + offsetFromSymbolStart = "24"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "E19DB0AE-EBC4-42E6-A48E-0A5B64A9CF56" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "73" + endingLineNumber = "73" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "5AA79044-F9D9-4539-870E-8082CCF4F458" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "532" + endingLineNumber = "532" + landmarkName = "modmult_gpu_execute(info, state, x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "5AA79044-F9D9-4539-870E-8082CCF4F458 - 30fdc229490fff9e" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_gpu_execute" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "477" + endingLineNumber = "477" + offsetFromSymbolStart = "117"> + </Location> + <Location + uuid = "5AA79044-F9D9-4539-870E-8082CCF4F458 - 30fdc229490fffdc" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_gpu_execute" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "479" + endingLineNumber = "479" + offsetFromSymbolStart = "117"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "29FF3D84-E5F9-4429-8A53-756F9A7E5AD4" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "259" + endingLineNumber = "259" + landmarkName = "modmult_opencl_prepare(info, state, x_buf, m_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "CCF0BFD9-35C8-47D4-A9DE-665DC105BDF8" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "137" + endingLineNumber = "137" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "CCF0BFD9-35C8-47D4-A9DE-665DC105BDF8 - 18037aea005af767" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "137" + endingLineNumber = "137" + offsetFromSymbolStart = "1406"> + </Location> + <Location + uuid = "CCF0BFD9-35C8-47D4-A9DE-665DC105BDF8 - 18037aea005af725" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "139" + endingLineNumber = "139" + offsetFromSymbolStart = "1406"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "854BEA05-AC22-4D30-B923-D574599C490D" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "154" + endingLineNumber = "154" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "854BEA05-AC22-4D30-B923-D574599C490D - 18037aea005af4a9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "135" + endingLineNumber = "135" + offsetFromSymbolStart = "1465"> + </Location> + <Location + uuid = "854BEA05-AC22-4D30-B923-D574599C490D - 18037aea005af63e" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "146" + endingLineNumber = "146" + offsetFromSymbolStart = "1590"> + </Location> + <Location + uuid = "854BEA05-AC22-4D30-B923-D574599C490D - 18037aea005af640" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "144" + endingLineNumber = "144" + offsetFromSymbolStart = "1665"> + </Location> + <Location + uuid = "854BEA05-AC22-4D30-B923-D574599C490D - 18037aea005ac936" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "154" + endingLineNumber = "154" + offsetFromSymbolStart = "1730"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "56542C6C-ED16-48E5-A345-C0E798659638" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "378" + endingLineNumber = "378" + landmarkName = "modmult_opencl_results(info, state, timed, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "56542C6C-ED16-48E5-A345-C0E798659638 - b46ebf1cc4a0ba5c" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "358" + endingLineNumber = "358" + offsetFromSymbolStart = "315"> + </Location> + <Location + uuid = "56542C6C-ED16-48E5-A345-C0E798659638 - b46ebf1cc4a0bcc9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "369" + endingLineNumber = "369" + offsetFromSymbolStart = "315"> + </Location> + <Location + uuid = "56542C6C-ED16-48E5-A345-C0E798659638 - b46ebf1cc4a0bb54" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "366" + endingLineNumber = "366" + offsetFromSymbolStart = "315"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "A0B20FE3-FB60-4D60-9B51-300DE8543447" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "364" + endingLineNumber = "364" + landmarkName = "modmult_opencl_results(info, state, timed, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "A0B20FE3-FB60-4D60-9B51-300DE8543447 - b46ebf1cc4a0b84c" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "342" + endingLineNumber = "342" + offsetFromSymbolStart = "148"> + </Location> + <Location + uuid = "A0B20FE3-FB60-4D60-9B51-300DE8543447 - b46ebf1cc4a0baf9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "353" + endingLineNumber = "353" + offsetFromSymbolStart = "148"> + </Location> + <Location + uuid = "A0B20FE3-FB60-4D60-9B51-300DE8543447 - b46ebf1cc4a0b944" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "350" + endingLineNumber = "350" + offsetFromSymbolStart = "148"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "175" + endingLineNumber = "175" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10 - 18037aea005ac82e" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "162" + endingLineNumber = "162" + offsetFromSymbolStart = "1892"> + </Location> + <Location + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10 - 18037aea005acb83" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "173" + endingLineNumber = "173" + offsetFromSymbolStart = "2017"> + </Location> + <Location + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10 - 18037aea005acb07" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "169" + endingLineNumber = "169" + offsetFromSymbolStart = "2078"> + </Location> + <Location + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10 - 18037aea005acb07" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "169" + endingLineNumber = "169" + offsetFromSymbolStart = "2075"> + </Location> + <Location + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10 - 18037aea005acb07" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "169" + endingLineNumber = "169" + offsetFromSymbolStart = "2072"> + </Location> + <Location + uuid = "6B6DD1A1-289E-455E-B49C-DDF8158E3B10 - 18037aea005aca41" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "175" + endingLineNumber = "175" + offsetFromSymbolStart = "2194"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "370" + endingLineNumber = "370" + landmarkName = "modmult_opencl_results(info, state, timed, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0ba9a" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "356" + endingLineNumber = "356" + offsetFromSymbolStart = "272"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0bfd1" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "393" + endingLineNumber = "393" + offsetFromSymbolStart = "272"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0bf93" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "395" + endingLineNumber = "395" + offsetFromSymbolStart = "272"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0bf55" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "397" + endingLineNumber = "397" + offsetFromSymbolStart = "272"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0bf55" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "397" + endingLineNumber = "397" + offsetFromSymbolStart = "290"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0be1f" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "391" + endingLineNumber = "391" + offsetFromSymbolStart = "290"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0bcc9" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "369" + endingLineNumber = "369" + offsetFromSymbolStart = "306"> + </Location> + <Location + uuid = "5C0ACEE0-4246-4CA2-9B7C-A5B3E417DD3E - b46ebf1cc4a0bbb3" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "modmult_opencl_results" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "363" + endingLineNumber = "363" + offsetFromSymbolStart = "282"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "1D13B1BF-088A-44A4-B036-D2267F8385C5" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "133" + endingLineNumber = "133" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + <Locations> + <Location + uuid = "1D13B1BF-088A-44A4-B036-D2267F8385C5 - 18037aea005af42d" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "131" + endingLineNumber = "131" + offsetFromSymbolStart = "1360"> + </Location> + <Location + uuid = "1D13B1BF-088A-44A4-B036-D2267F8385C5 - 18037aea005af4eb" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + symbolName = "montmodmult_pairs_from_files" + moduleName = "lib-gpu-verify" + usesParentBreakpointCondition = "Yes" + urlString = "file:///Users/cedriczwahlen/libgpuverify/source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "133" + endingLineNumber = "133" + offsetFromSymbolStart = "1375"> + </Location> + </Locations> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "FB38C9CB-9FB8-4B84-9CE2-7184FCD7F326" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montgomery.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "144" + endingLineNumber = "144" + landmarkName = "mont_prepare(b, e, m, r, r_1, ni, M, x)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "EC8E40B9-5869-4CD4-A602-C7739D7BFF03" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/rsa-test.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "251" + endingLineNumber = "251" + landmarkName = "opencl_pairs_from_files(bases, b_len, exponents, e_len, moduli, m_len, signatures, s_len, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "E4BEB202-36D5-4E45-9886-88D8B2A6D37B" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "392" + endingLineNumber = "392" + landmarkName = "modmult_opencl_results(info, state, timed, msg_buf, r_1_buf, n_buf, s_buf, mod_buf, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "EBE3EB24-9B9A-43BD-850A-460559601A71" + shouldBeEnabled = "No" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "168" + endingLineNumber = "168" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> + <BreakpointProxy + BreakpointExtensionID = "Xcode.Breakpoint.FileBreakpoint"> + <BreakpointContent + uuid = "7E182A4C-319B-4622-9FD0-18C77CB42D7B" + shouldBeEnabled = "Yes" + ignoreCount = "0" + continueAfterRunningActions = "No" + filePath = "../source/montmodmult.c" + startingColumnNumber = "9223372036854775807" + endingColumnNumber = "9223372036854775807" + startingLineNumber = "155" + endingLineNumber = "155" + landmarkName = "montmodmult_pairs_from_files(x_buf, m_buf, r_1_buf, n_buf, ni_buf, msg_buf, exp_buf, mod_buf, s_buf, pks, n)" + landmarkType = "9"> + </BreakpointContent> + </BreakpointProxy> </Breakpoints> </Bucket> diff --git a/xcode/montmodmult.cl b/xcode/montmodmult.cl @@ -0,0 +1,375 @@ + + +typedef ulong gpu_register; + +#define BITS_PER_DIGIT (sizeof(gpu_register) * 8) +#define HIBITMASK 0x80000000UL + + +int mult(gpu_register p[2], gpu_register x, gpu_register y) +{ + + + + + /* Use a 64-bit temp for product */ + //ulong t = (ulong)x * (ulong)y; + /* then split into two parts */ + p[1] = mul_hi(x,y); + p[0] = x * y; + + return 0; +} + + +int multiply(__global gpu_register *w, __global gpu_register *u, __global gpu_register *v, size_t ndigits) +{ + /* Computes product w = u * v + where u, v are multiprecision integers of ndigits each + and w is a multiprecision integer of 2*ndigits + + Ref: Knuth Vol 2 Ch 4.3.1 p 268 Algorithm M. + */ + + gpu_register k, t[2]; + size_t i, j, m, n; + + //assert(w != u && w != v); + + m = n = ndigits; + + /* Step M1. Initialise */ + for (i = 0; i < 2 * m; i++) + w[i] = 0; + + for (j = 0; j < n; j++) + { + /* Step M2. Zero multiplier? */ + if (v[j] == 0) + { + w[j + m] = 0; + } + else + { + /* Step M3. Initialise i */ + k = 0; + for (i = 0; i < m; i++) + { + /* Step M4. Multiply and add */ + /* t = u_i * v_j + w_(i+j) + k */ + mult(t, u[i], v[j]); + + t[0] += k; + if (t[0] < k) + t[1]++; + t[0] += w[i+j]; + if (t[0] < w[i+j]) + t[1]++; + + w[i+j] = t[0]; + k = t[1]; + } + /* Step M5. Loop on i, set w_(j+m) = k */ + w[j+m] = k; + } + } /* Step M6. Loop on j */ + + return 0; +} + + +int square(__global gpu_register *w, __global gpu_register *x, size_t ndigits) +/* New in Version 2.0 */ +{ + /* Computes square w = x * x + where x is a multiprecision integer of ndigits + and w is a multiprecision integer of 2*ndigits + + Ref: Menezes p596 Algorithm 14.16 with errata. + */ + + gpu_register k, p[2], u[2], cbit, carry; + size_t i, j, t, i2, cpos; + + t = ndigits; + + /* 1. For i from 0 to (2t-1) do: w_i = 0 */ + i2 = t << 1; + for (i = 0; i < i2; i++) + w[i] = 0; + + carry = 0; + cpos = i2-1; + /* 2. For i from 0 to (t-1) do: */ + for (i = 0; i < t; i++) + { + /* 2.1 (uv) = w_2i + x_i * x_i, w_2i = v, c = u + Careful, w_2i may be double-prec + */ + i2 = i << 1; /* 2*i */ + mult(p, x[i], x[i]); + p[0] += w[i2]; + if (p[0] < w[i2]) + p[1]++; + k = 0; /* p[1] < b, so no overflow here */ + if (i2 == cpos && carry) + { + p[1] += carry; + if (p[1] < carry) + k++; + carry = 0; + } + w[i2] = p[0]; + u[0] = p[1]; + u[1] = k; + + /* 2.2 for j from (i+1) to (t-1) do: + (uv) = w_{i+j} + 2x_j * x_i + c, + w_{i+j} = v, c = u, + u is double-prec + w_{i+j} is dbl if [i+j] == cpos + */ + k = 0; + for (j = i+1; j < t; j++) + { + /* p = x_j * x_i */ + mult(p, x[j], x[i]); + /* p = 2p <=> p <<= 1 */ + cbit = (p[0] & HIBITMASK) != 0; + k = (p[1] & HIBITMASK) != 0; + p[0] <<= 1; + p[1] <<= 1; + p[1] |= cbit; + /* p = p + c */ + p[0] += u[0]; + if (p[0] < u[0]) + { + p[1]++; + if (p[1] == 0) + k++; + } + p[1] += u[1]; + if (p[1] < u[1]) + k++; + /* p = p + w_{i+j} */ + p[0] += w[i+j]; + if (p[0] < w[i+j]) + { + p[1]++; + if (p[1] == 0) + k++; + } + if ((i+j) == cpos && carry) + { /* catch overflow from last round */ + p[1] += carry; + if (p[1] < carry) + k++; + carry = 0; + } + /* w_{i+j} = v, c = u */ + w[i+j] = p[0]; + u[0] = p[1]; + u[1] = k; + } + /* 2.3 w_{i+t} = u */ + w[i+t] = u[0]; + /* remember overflow in w_{i+t} */ + carry = u[1]; + cpos = i+t; + } + + /* (NB original step 3 deleted in Menezes errata) */ + + /* Return w */ + + return 0; +} + +gpu_register shift_r(__global gpu_register *a, __global gpu_register *b, size_t shift, size_t ndigits) +{ /* Computes a = b >> shift */ + /* [v2.1] Modified to cope with shift > BITS_PERDIGIT */ + + gpu_register carry = 0; + + while (1) { + + size_t i, y, nw, bits; + gpu_register mask, tempCarry, nextcarry; + + /* Do we shift whole digits? */ + if (shift >= BITS_PER_DIGIT) + { + nw = shift / BITS_PER_DIGIT; + for (i = 0; i < ndigits; i++) + { + if ((i+nw) < ndigits) + a[i] = b[i+nw]; + else + a[i] = 0; + } + /* Call again to shift bits inside digits */ + bits = shift % BITS_PER_DIGIT; + tempCarry = b[nw-1] >> bits; + if (bits) + carry |= tempCarry; + return carry; + } + else + { + bits = shift; + } + + /* Construct mask to set low bits */ + /* (thanks to Jesse Chisholm for suggesting this improved technique) */ + mask = ~(~(gpu_register)0 << bits); + + y = BITS_PER_DIGIT - bits; + carry = 0; + i = ndigits; + while (i--) + { + nextcarry = (b[i] & mask) << y; + a[i] = b[i] >> bits | carry; + carry = nextcarry; + } + + return carry; + + } +} + +/* + determine by how much to divide / shift + from most significant of double size number, look for first high bit. + */ + +/* +gpu_register shift_by(__global gpu_register *r, int n) { + + gpu_register u = 8 * sizeof(gpu_register); + + for (int i = n-1; i >= (n / 2); i--) + { + if (r[i] != 0) { + int k = ceil(log2((float)r[i] + (float)1)); + gpu_register total = k + i * u; + + return total - (u * (n / 2)); + } + } + + return 0; +} +*/ +gpu_register add(__global gpu_register *w, __global gpu_register *u, __global gpu_register *v, size_t ndigits) +{ + /* Calculates w = u + v + where w, u, v are multiprecision integers of ndigits each + Returns carry if overflow. Carry = 0 or 1. + + Ref: Knuth Vol 2 Ch 4.3.1 p 266 Algorithm A. + */ + + gpu_register k; + size_t j; + + //assert(w != v); + + /* Step A1. Initialise */ + k = 0; + + for (j = 0; j < ndigits; j++) + { + /* Step A2. Add digits w_j = (u_j + v_j + k) + Set k = 1 if carry (overflow) occurs + */ + w[j] = u[j] + k; + if (w[j] < k) + k = 1; + else + k = 0; + + w[j] += v[j]; + if (w[j] < v[j]) + k++; + + } /* Step A3. Loop on j */ + + return k; /* w_n = k */ +} + +void equal(__global gpu_register *a, __global gpu_register *b, size_t ndigits) +{ /* Sets a = b */ + size_t i; + + for (i = 0; i < ndigits; i++) + { + a[i] = b[i]; + } +} + +void erase_above(__global gpu_register *a, size_t n) +{ + + for (int i = n-1; i >= (n / 2); i--) + { + a[i] = 0; + } + +} + +int testbit(gpu_register e, int i) { + + return (e & (0x1 << (gpu_register)i) ) > 0 ? 1 : 0; + +} + +__kernel + void mont(__global gpu_register *x, __global gpu_register *m, + __global gpu_register *res, __global gpu_register *n, // res is not needed, we write the result in x + __global gpu_register *ni, __global gpu_register *exp, + __global gpu_register *tmp_1, __global gpu_register *tmp_2, + __global gpu_register *pks//, unsigned long count // invalid is not needed either + ) +{ + + size_t i = get_global_id(0); + + int offs = 0; // the size of one number + + int pk = 0; // das funktioniert so nicht – die globale id wird grösser, ohne dass noch weitere elemente in pks sind... + + +// while (1) { +// if (pks[pk] >= i) +// break; +// pk++; +// } + + + int k = ceil(log2((float)exp[pk] + (float)1)); + + //printf((char __constant *)"%i\n", k); + + barrier(CLK_GLOBAL_MEM_FENCE | CLK_LOCAL_MEM_FENCE); + + equal(tmp_2, x, 32); + + int z = 0; + + for (int j = k - 1; j >= 0; j--) { + + square(tmp_1,tmp_2,32); + erase_above(tmp_1, 64); + //printf((char __constant *)"sqr\n"); + + if (testbit(exp[pk], j)) { + multiply(tmp_1,tmp_2,m,32); + erase_above(tmp_1, 64); + //printf((char __constant *)"mul\n"); + } + } + + equal(res, tmp_1, 32); + +} diff --git a/xcode/verify.cl b/xcode/verify.cl @@ -1240,7 +1240,8 @@ __kernel void several(__global DIGIT_T* x, __global const unsigned long *s_len, int ndigits = max( max( n_len[pk] - (pk == 0 ? 0 : n_len[pk - 1]), mm_len[index] - (index == 0 ? 0 : mm_len[index - 1]) ), s_len[index] - (index == 0 ? 0 : s_len[index - 1]) ); int edigits = e_len[pk] - (pk == 0 ? 0 : e_len[pk - 1] ); - + + //printf((char __constant *)"%i\n", ndigits); // the result is copied in here, compare it to mm DIGIT_T yout[MAX_ALLOC_SIZE * 2]; @@ -1260,9 +1261,9 @@ __kernel void several(__global DIGIT_T* x, __global const unsigned long *s_len, window_mm = &mm[index == 0 ? 0 : (mm_len[index - 1])]; - __private DIGIT_T t1[MAX_ALLOC_SIZE *2]; - __private DIGIT_T t2[MAX_ALLOC_SIZE *2]; - __private DIGIT_T y[MAX_ALLOC_SIZE *2]; + __private DIGIT_T t1[MAX_ALLOC_SIZE *2]; // obsolete? + __private DIGIT_T t2[MAX_ALLOC_SIZE *2]; // obsolete? + __private DIGIT_T y[MAX_ALLOC_SIZE *2]; // obsolete? n = mpSizeof_g(window_e, edigits); /* Catch e==0 => x^0=1 */