LAMMP 4.1.0
Lamina High-Precision Arithmetic Library
载入中...
搜索中...
未找到
mul_toom22.c
浏览该文件的文档.
1/*
2 * LAMMP - Copyright (C) 2025-2026 HJimmyK(Jericho Knox)
3 * This file is part of lammp, under the GNU LGPL v2 license.
4 * See LICENSE in the project root for the full license text.
5 */
6
7#include "../../include/lammp/impl/tmp_alloc.h"
8#include "../../include/lammp/lmmpn.h"
9
10/*
11Evaluate in: -1, 0, +inf
12
13 <-s--><--n-->
14 |-a1-|--a0--|
15 |b1-|--b0--|
16 <-t-><--n-->
17
18v0 = a0 * b0 # A(0)*B(0)
19vm1 = (a0-a1)*(b0-b1) # A(-1)*B(-1)
20vinf= a1 * b1 # A(inf)*B(inf)
21*/
22
23void lmmp_mul_toom22_(mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na, mp_srcptr restrict numb, mp_size_t nb) {
24 lmmp_param_assert(nb >= 5);
25 lmmp_param_assert(na >= nb);
26 lmmp_param_assert(4 * na <= 5 * nb);
28 mp_size_t s = na >> 1, n = na - s, t = nb - n;
29 mp_limb_t* restrict vm1 = SALLOC_TYPE(2 * n, mp_limb_t);
30 int vm1_neg = 0;
31 mp_slimb_t cy, cy2;
32
33#define a0 numa
34#define a1 (numa + n)
35#define b0 numb
36#define b1 (numb + n)
37#define asm1 dst
38#define bsm1 (dst + n)
39
40 if (s == n) {
41 if (lmmp_cmp_(a0, a1, n) < 0) {
42 lmmp_sub_n_(asm1, a1, a0, n);
43 vm1_neg = 1;
44 } else
45 lmmp_sub_n_(asm1, a0, a1, n);
46 } else { // s==n-1
47 if (a0[s] == 0 && lmmp_cmp_(a0, a1, s) < 0) {
48 lmmp_sub_n_(asm1, a1, a0, s);
49 asm1[s] = 0;
50 vm1_neg = 1;
51 } else
52 asm1[s] = a0[s] - lmmp_sub_n_(asm1, a0, a1, s);
53 }
54
55 if (t == n) {
56 if (lmmp_cmp_(b0, b1, n) < 0) {
57 lmmp_sub_n_(bsm1, b1, b0, n);
58 vm1_neg ^= 1;
59 } else
60 lmmp_sub_n_(bsm1, b0, b1, n);
61 } else {
62 if (lmmp_zero_q_(b0 + t, n - t) && lmmp_cmp_(b0, b1, t) < 0) {
63 lmmp_sub_n_(bsm1, b1, b0, t);
64 lmmp_zero(bsm1 + t, n - t);
65 vm1_neg ^= 1;
66 } else
67 lmmp_sub_(bsm1, b0, n, b1, t);
68 }
69
71
72#undef asm1
73#undef bsm1
74#define v0 dst
75#define vinf (dst + 2 * n)
76
77 lmmp_mul_n_(v0, a0, b0, n);
78
79 lmmp_mul_(vinf, a1, s, b1, t);
80
81 cy = lmmp_add_n_(dst + 2 * n, v0 + n, vinf, n);
82 cy2 = cy + lmmp_add_n_(dst + n, dst + 2 * n, v0, n);
83 cy += lmmp_add_(dst + 2 * n, dst + 2 * n, n, vinf + n, s + t - n);
84
85 if (vm1_neg)
86 cy += lmmp_add_n_(dst + n, dst + n, vm1, 2 * n);
87 else
88 cy -= lmmp_sub_n_(dst + n, dst + n, vm1, 2 * n);
89
90 // no overflow, if s+t>n. proved.
91 lmmp_inc_1(dst + 2 * n, cy2);
92
93 if (cy < 0)
94 lmmp_dec(dst + 3 * n);
95 else
96 lmmp_inc_1(dst + 3 * n, cy);
98}
mp_limb_t * mp_ptr
Definition lmmp.h:215
#define lmmp_zero(dst, n)
Definition lmmp.h:366
uint64_t mp_size_t
Definition lmmp.h:212
int64_t mp_slimb_t
Definition lmmp.h:213
const mp_limb_t * mp_srcptr
Definition lmmp.h:216
uint64_t mp_limb_t
Definition lmmp.h:211
#define lmmp_param_assert(x)
Definition lmmp.h:398
static mp_limb_t lmmp_add_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_srcptr numb, mp_size_t nb)
大数加法静态内联函数 [dst,na]=[numa,na]+[numb,nb]
Definition lmmpn.h:1058
static int lmmp_cmp_(mp_srcptr numa, mp_srcptr numb, mp_size_t n)
大数比较函数(内联)
Definition lmmpn.h:1004
#define lmmp_dec(p)
大数减1宏(预期无借位)
Definition lmmpn.h:973
void lmmp_mul_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_srcptr numb, mp_size_t nb)
不等长大数乘法操作 [dst,na+nb] = [numa,na] * [numb,nb]
void lmmp_mul_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
等长大数乘法操作 [dst,2*n] = [numa,n] * [numb,n]
Definition mul.c:99
static mp_limb_t lmmp_sub_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_srcptr numb, mp_size_t nb)
大数减法静态内联函数 [dst,na]=[numa,na]-[numb,nb]
Definition lmmpn.h:1072
mp_limb_t lmmp_sub_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
无借位的n位减法 [dst,n] = [numa,n] - [numb,n]
Definition sub_n.c:70
#define lmmp_inc_1(p, inc)
大数加指定值宏(预期无进位)
Definition lmmpn.h:958
mp_limb_t lmmp_add_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
无进位的n位加法 [dst,n] = [numa,n] + [numb,n]
Definition add_n.c:71
static int lmmp_zero_q_(mp_srcptr p, mp_size_t n)
大数判零函数(内联)
Definition lmmpn.h:1027
void lmmp_mul_toom22_(mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na, mp_srcptr restrict numb, mp_size_t nb)
Definition mul_toom22.c:23
#define b0
#define v0
#define b1
#define bsm1
#define a0
#define a1
#define asm1
#define vinf
#define vm1
#define SALLOC_TYPE(n, type)
Definition tmp_alloc.h:87
#define TEMP_S_DECL
Definition tmp_alloc.h:76
#define TEMP_S_FREE
Definition tmp_alloc.h:105