LAMMP 4.1.0
Lamina High-Precision Arithmetic Library
载入中...
搜索中...
未找到
sqr_toom2.c
浏览该文件的文档.
1/*
2 * LAMMP - Copyright (C) 2025-2026 HJimmyK(Jericho Knox)
3 * This file is part of lammp, under the GNU LGPL v2 license.
4 * See LICENSE in the project root for the full license text.
5 */
6
7#include "../../include/lammp/impl/tmp_alloc.h"
8#include "../../include/lammp/lmmpn.h"
9
10/*
11Evaluate in: -1, 0, +inf
12
13 <-s--><--n-->
14 |-a1-|--a0--|
15
16v0 = a0 ^2 # A(0)^2
17vm1 = (a0-a1)^2 # A(-1)^2
18vinf= a1 ^2 # A(inf)^2
19*/
20
21void lmmp_sqr_toom2_(mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na) {
22 lmmp_param_assert(na > 0);
23 lmmp_param_assert(dst != NULL);
24 lmmp_param_assert(numa!= NULL);
26 mp_size_t s = na >> 1, n = na - s;
28 mp_slimb_t cy, cy2;
29
30#define a0 numa
31#define a1 (numa + n)
32#define asm1 dst
33
34 if (s == n) {
35 if (lmmp_cmp_(a0, a1, n) < 0)
36 lmmp_sub_n_(asm1, a1, a0, n);
37 else
38 lmmp_sub_n_(asm1, a0, a1, n);
39 } else { // s==n-1
40 if (a0[s] == 0 && lmmp_cmp_(a0, a1, s) < 0) {
41 lmmp_sub_n_(asm1, a1, a0, s);
42 asm1[s] = 0;
43 } else
44 asm1[s] = a0[s] - lmmp_sub_n_(asm1, a0, a1, s);
45 }
46
47 lmmp_sqr_(vm1, asm1, n);
48
49#undef asm1
50#define v0 dst
51#define vinf (dst + 2 * n)
52
53 lmmp_sqr_(v0, a0, n);
54
55 lmmp_sqr_(vinf, a1, s);
56
57 cy = lmmp_add_n_(dst + 2 * n, v0 + n, vinf, n);
58 cy2 = cy + lmmp_add_n_(dst + n, dst + 2 * n, v0, n);
59 cy += lmmp_add_(dst + 2 * n, dst + 2 * n, n, vinf + n, s + s - n);
60
61 cy -= lmmp_sub_n_(dst + n, dst + n, vm1, 2 * n);
62
63 // no overflow.
64 lmmp_inc_1(dst + 2 * n, cy2);
65
66 if (cy < 0)
67 lmmp_dec(dst + 3 * n);
68 else
69 lmmp_inc_1(dst + 3 * n, cy);
71}
mp_limb_t * mp_ptr
Definition lmmp.h:215
uint64_t mp_size_t
Definition lmmp.h:212
int64_t mp_slimb_t
Definition lmmp.h:213
const mp_limb_t * mp_srcptr
Definition lmmp.h:216
uint64_t mp_limb_t
Definition lmmp.h:211
#define lmmp_param_assert(x)
Definition lmmp.h:398
static mp_limb_t lmmp_add_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_srcptr numb, mp_size_t nb)
大数加法静态内联函数 [dst,na]=[numa,na]+[numb,nb]
Definition lmmpn.h:1058
static int lmmp_cmp_(mp_srcptr numa, mp_srcptr numb, mp_size_t n)
大数比较函数(内联)
Definition lmmpn.h:1004
#define lmmp_dec(p)
大数减1宏(预期无借位)
Definition lmmpn.h:973
void lmmp_sqr_(mp_ptr dst, mp_srcptr numa, mp_size_t na)
大数平方操作 [dst,2*na] = [numa,na]^2
Definition sqr.c:10
mp_limb_t lmmp_sub_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
无借位的n位减法 [dst,n] = [numa,n] - [numb,n]
Definition sub_n.c:70
#define lmmp_inc_1(p, inc)
大数加指定值宏(预期无进位)
Definition lmmpn.h:958
mp_limb_t lmmp_add_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
无进位的n位加法 [dst,n] = [numa,n] + [numb,n]
Definition add_n.c:71
#define vm1
#define v0
#define a0
#define a1
#define asm1
#define vinf
void lmmp_sqr_toom2_(mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na)
Definition sqr_toom2.c:21
#define SALLOC_TYPE(n, type)
Definition tmp_alloc.h:87
#define TEMP_S_DECL
Definition tmp_alloc.h:76
#define TEMP_S_FREE
Definition tmp_alloc.h:105