d5/db9/add__n__sub__n_8c_source.html

/*

 * LAMMP - Copyright (C) 2025-2026 HJimmyK(Jericho Knox)

 * This file is part of lammp, under the GNU LGPL v2 license.

 * See LICENSE in the project root for the full license text.

 */


#include "../../include/lammp/impl/mparam.h"

#include "../../include/lammp/lmmpn.h"


mp_limb_t lmmp_add_n_sub_n_(mp_ptr dsta, mp_ptr dstb, mp_srcptr numa, mp_srcptr numb, mp_size_t n) {

    /*

    这段代码看起来有点奇怪的原因是，对于使用x64汇编时，我们会使用带进位的加法和减法，而x64中

    只能使用同一个进位寄存器，所以我们需要将两条指令分开执行。

    而不使用汇编时，编译器通常不会使用进位寄存器。因此我们可以同时读取两路内存，以减少读写次数。

    */

#ifdef USE_ASM

    mp_limb_t acyo = 0, scyo = 0;

    mp_size_t off, this_n;


    if (dsta != numa && dsta != numb) {

        for (off = 0; off < n; off += PART_SIZE) {

            this_n = LMMP_MIN(n - off, PART_SIZE);

            acyo = lmmp_add_nc_(dsta + off, numa + off, numb + off, this_n, acyo);

            scyo = lmmp_sub_nc_(dstb + off, numa + off, numb + off, this_n, scyo);

        }

    } else if (dstb != numa && dstb != numb) {

        for (off = 0; off < n; off += PART_SIZE) {

            this_n = LMMP_MIN(n - off, PART_SIZE);

            scyo = lmmp_sub_nc_(dstb + off, numa + off, numb + off, this_n, scyo);

            acyo = lmmp_add_nc_(dsta + off, numa + off, numb + off, this_n, acyo);

        }

    } else {

        mp_limb_t tp[PART_SIZE];

        for (off = 0; off < n; off += PART_SIZE) {

            this_n = LMMP_MIN(n - off, PART_SIZE);

            acyo = lmmp_add_nc_(tp, numa + off, numb + off, this_n, acyo);

            scyo = lmmp_sub_nc_(dstb + off, numa + off, numb + off, this_n, scyo);

            lmmp_copy(dsta + off, tp, this_n);

        }

    }

    return 2 * acyo + scyo;

#else

    mp_size_t i;

    mp_limb_t acyo, scyo;


    for (i = 0, acyo = 0, scyo = 0; i < n; i++) {

        mp_limb_t a, b, r;

        a = numa[i];

        b = numb[i];

        r = a + acyo;

        acyo = (r < acyo);

        r += b;

        acyo += (r < b);

        dsta[i] = r;


        b += scyo;

        scyo = (b < scyo);

        scyo += (a < b);

        dstb[i] = a - b;

    }

    return 2 * acyo + scyo;

#endif

}


lmmp_add_n_sub_n_
mp_limb_t lmmp_add_n_sub_n_(mp_ptr dsta, mp_ptr dstb, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
同时执行n位加法和减法 ([dsta,n],[dstb,n]) = ([numa,n]+[numb,n],[numa,n]-[numb,n])
Definition add_n_sub_n.c:10

mp_ptr
mp_limb_t * mp_ptr
Definition lmmp.h:215

lmmp_copy
#define lmmp_copy(dst, src, n)
Definition lmmp.h:364

mp_size_t
uint64_t mp_size_t
Definition lmmp.h:212

mp_srcptr
const mp_limb_t * mp_srcptr
Definition lmmp.h:216

mp_limb_t
uint64_t mp_limb_t
Definition lmmp.h:211

LMMP_MIN
#define LMMP_MIN(l, o)
Definition lmmp.h:348

lmmp_add_nc_
mp_limb_t lmmp_add_nc_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n, mp_limb_t c)
带进位的n位加法 [dst,n] = [numa,n] + [numb,n] + c
Definition add_n.c:9

lmmp_sub_nc_
mp_limb_t lmmp_sub_nc_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n, mp_limb_t c)
带借位的n位减法 [dst,n] = [numa,n] - [numb,n] - c
Definition sub_n.c:9

PART_SIZE
#define PART_SIZE
Definition mparam.h:89

tp
#define tp