LAMMP 4.1.0
Lamina High-Precision Arithmetic Library
载入中...
搜索中...
未找到
sqr_toom3.c
浏览该文件的文档.
1/*
2 * LAMMP - Copyright (C) 2025-2026 HJimmyK(Jericho Knox)
3 * This file is part of lammp, under the GNU LGPL v2 license.
4 * See LICENSE in the project root for the full license text.
5 */
6
7#include "../../include/lammp/lmmpn.h"
8#include "../../include/lammp/impl/toom_interp.h"
9
10/*
11Evaluate in: -1, 0, +1, +2, +inf
12
13 <-s--><--n--><--n-->
14 |-a2-|--a1--|--a0--|
15
16v0 = a0 *^2 # A(0)^2
17v1 = (a0+ a1+ a2)*^2 # A(1)^2 ah <= 2
18vm1 = (a0- a1+ a2)*^2 # A(-1)^2 |ah| <= 1
19v2 = (a0+2a1+4a2)*^2 # A(2)^2 ah <= 6
20vinf= a2 *^2 # A(inf)^2
21*/
22
23void lmmp_sqr_toom3_(mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na) {
24 lmmp_param_assert(na > 0);
25 lmmp_param_assert(numa != NULL);
26 lmmp_param_assert(dst != NULL);
28 mp_size_t n = (na + 2) / 3, s = na - 2 * n;
29 mp_limb_t cy, cy2, vinf0, am1h;
30 mp_limb_t* restrict tp = SALLOC_TYPE(4 * n + 4, mp_limb_t);
31
32#define a0 numa
33#define a1 (numa + n)
34#define a2 (numa + 2 * n)
35
36#define v0 dst //[dst,2*n]
37#define v1 (dst + 2 * n) //[dst+2*n,2*n+1]
38#define vinf (dst + 4 * n) //[dst+4*n,s+t]
39#define vm1 tp //[tp,2*n+1]
40#define v2 (tp + 2 * n + 2) //[tp+2*n+2,2*n+1]
41
42#define am1 (dst) //[dst,n]
43#define ap1 tp //[tp,n+1]
44#define ap2 ap1 // same space
45
46 // ap1, am1
47 cy = lmmp_add_(ap1, a0, n, a2, s);
48 if (cy == 0 && lmmp_cmp_(ap1, a1, n) < 0) {
49 cy = lmmp_add_n_sub_n_(ap1, am1, a1, ap1, n);
50 ap1[n] = cy >> 1;
51 am1h = 0;
52 } else {
53 cy2 = lmmp_add_n_sub_n_(ap1, am1, ap1, a1, n);
54 ap1[n] = cy + (cy2 >> 1);
55 am1h = cy - (cy2 & 1);
56 }
57
58 // vinf
59 lmmp_sqr_(vinf, a2, s);
60 vinf0 = vinf[0]; // overlap with v1
61 cy = vinf[1]; // overlap with v1
62
63 // v1
64 lmmp_sqr_(v1, ap1, n + 1);
65 vinf[1] = cy; // restore, since v1[2*n+1]==0.
66
67 // ap2
68 cy = lmmp_addshl1_n_(ap2, a1, a2, s);
69 if (s != n)
70 cy = lmmp_add_1_(ap2 + s, a1 + s, n - s, cy);
71 cy = 2 * cy + lmmp_addshl1_n_(ap2, a0, ap2, n);
72 ap2[n] = cy;
73
74 // v2
75 lmmp_sqr_(v2, ap2, n + 1);
76
77 // vm1
78 lmmp_sqr_(vm1, am1, n);
79 if (am1h)
80 am1h += lmmp_addshl1_n_(vm1 + n, vm1 + n, am1, n);
81 vm1[2 * n] = am1h;
82
83 // v0
84 lmmp_sqr_(v0, a0, n);
85
86 lmmp_toom_interp5_(dst, v2, vm1, n, s + s, 0, vinf0);
88}
mp_limb_t * mp_ptr
Definition lmmp.h:215
uint64_t mp_size_t
Definition lmmp.h:212
const mp_limb_t * mp_srcptr
Definition lmmp.h:216
uint64_t mp_limb_t
Definition lmmp.h:211
#define lmmp_param_assert(x)
Definition lmmp.h:398
static mp_limb_t lmmp_add_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_srcptr numb, mp_size_t nb)
大数加法静态内联函数 [dst,na]=[numa,na]+[numb,nb]
Definition lmmpn.h:1058
static int lmmp_cmp_(mp_srcptr numa, mp_srcptr numb, mp_size_t n)
大数比较函数(内联)
Definition lmmpn.h:1004
static mp_limb_t lmmp_add_1_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_limb_t x)
大数加单精度数静态内联函数 [dst,na]=[numa,na]+x
Definition lmmpn.h:1111
void lmmp_sqr_(mp_ptr dst, mp_srcptr numa, mp_size_t na)
大数平方操作 [dst,2*na] = [numa,na]^2
Definition sqr.c:10
mp_limb_t lmmp_addshl1_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
加法结合左移1位操作 [dst,n] = [numa,n] + ([numb,n] << 1)
Definition shl.c:56
mp_limb_t lmmp_add_n_sub_n_(mp_ptr dsta, mp_ptr dstb, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
同时执行n位加法和减法 ([dsta,n],[dstb,n]) = ([numa,n]+[numb,n],[numa,n]-[numb,n])
Definition add_n_sub_n.c:10
#define tp
#define ap2
#define v0
#define am1
#define ap1
#define v2
#define vm1
#define a2
#define a0
#define a1
#define vinf
#define v1
void lmmp_sqr_toom3_(mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na)
Definition sqr_toom3.c:23
#define SALLOC_TYPE(n, type)
Definition tmp_alloc.h:87
#define TEMP_S_DECL
Definition tmp_alloc.h:76
#define TEMP_S_FREE
Definition tmp_alloc.h:105
void lmmp_toom_interp5_(mp_ptr dst, mp_ptr v2, mp_ptr vm1, mp_size_t n, mp_size_t spt, int vm1_neg, mp_limb_t vinf0)
Toom插值计算(5点插值),用于Toom-33和Toom-42乘法算法