LAMMP 4.1.0
Lamina High-Precision Arithmetic Library
载入中...
搜索中...
未找到
sqr_toom3.c 文件参考
+ sqr_toom3.c 的引用(Include)关系图:

浏览源代码.

宏定义

#define a0   numa
 
#define a1   (numa + n)
 
#define a2   (numa + 2 * n)
 
#define am1   (dst)
 
#define ap1   tp
 
#define ap2   ap1
 
#define v0   dst
 
#define v1   (dst + 2 * n)
 
#define v2   (tp + 2 * n + 2)
 
#define vinf   (dst + 4 * n)
 
#define vm1   tp
 

函数

void lmmp_sqr_toom3_ (mp_ptr restrict dst, mp_srcptr restrict numa, mp_size_t na)
 

宏定义说明

◆ a0

#define a0   numa

◆ a1

#define a1   (numa + n)

◆ a2

#define a2   (numa + 2 * n)

◆ am1

#define am1   (dst)

◆ ap1

#define ap1   tp

◆ ap2

#define ap2   ap1

◆ v0

#define v0   dst

◆ v1

#define v1   (dst + 2 * n)

◆ v2

#define v2   (tp + 2 * n + 2)

◆ vinf

#define vinf   (dst + 4 * n)

◆ vm1

#define vm1   tp

函数说明

◆ lmmp_sqr_toom3_()

void lmmp_sqr_toom3_ ( mp_ptr restrict  dst,
mp_srcptr restrict  numa,
mp_size_t  na 
)

在文件 sqr_toom3.c23 行定义.

23 {
24 lmmp_param_assert(na > 0);
25 lmmp_param_assert(numa != NULL);
26 lmmp_param_assert(dst != NULL);
28 mp_size_t n = (na + 2) / 3, s = na - 2 * n;
29 mp_limb_t cy, cy2, vinf0, am1h;
30 mp_limb_t* restrict tp = SALLOC_TYPE(4 * n + 4, mp_limb_t);
31
32#define a0 numa
33#define a1 (numa + n)
34#define a2 (numa + 2 * n)
35
36#define v0 dst //[dst,2*n]
37#define v1 (dst + 2 * n) //[dst+2*n,2*n+1]
38#define vinf (dst + 4 * n) //[dst+4*n,s+t]
39#define vm1 tp //[tp,2*n+1]
40#define v2 (tp + 2 * n + 2) //[tp+2*n+2,2*n+1]
41
42#define am1 (dst) //[dst,n]
43#define ap1 tp //[tp,n+1]
44#define ap2 ap1 // same space
45
46 // ap1, am1
47 cy = lmmp_add_(ap1, a0, n, a2, s);
48 if (cy == 0 && lmmp_cmp_(ap1, a1, n) < 0) {
49 cy = lmmp_add_n_sub_n_(ap1, am1, a1, ap1, n);
50 ap1[n] = cy >> 1;
51 am1h = 0;
52 } else {
53 cy2 = lmmp_add_n_sub_n_(ap1, am1, ap1, a1, n);
54 ap1[n] = cy + (cy2 >> 1);
55 am1h = cy - (cy2 & 1);
56 }
57
58 // vinf
59 lmmp_sqr_(vinf, a2, s);
60 vinf0 = vinf[0]; // overlap with v1
61 cy = vinf[1]; // overlap with v1
62
63 // v1
64 lmmp_sqr_(v1, ap1, n + 1);
65 vinf[1] = cy; // restore, since v1[2*n+1]==0.
66
67 // ap2
68 cy = lmmp_addshl1_n_(ap2, a1, a2, s);
69 if (s != n)
70 cy = lmmp_add_1_(ap2 + s, a1 + s, n - s, cy);
71 cy = 2 * cy + lmmp_addshl1_n_(ap2, a0, ap2, n);
72 ap2[n] = cy;
73
74 // v2
75 lmmp_sqr_(v2, ap2, n + 1);
76
77 // vm1
78 lmmp_sqr_(vm1, am1, n);
79 if (am1h)
80 am1h += lmmp_addshl1_n_(vm1 + n, vm1 + n, am1, n);
81 vm1[2 * n] = am1h;
82
83 // v0
84 lmmp_sqr_(v0, a0, n);
85
86 lmmp_toom_interp5_(dst, v2, vm1, n, s + s, 0, vinf0);
88}
uint64_t mp_size_t
Definition lmmp.h:212
uint64_t mp_limb_t
Definition lmmp.h:211
#define lmmp_param_assert(x)
Definition lmmp.h:398
static mp_limb_t lmmp_add_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_srcptr numb, mp_size_t nb)
大数加法静态内联函数 [dst,na]=[numa,na]+[numb,nb]
Definition lmmpn.h:1058
static int lmmp_cmp_(mp_srcptr numa, mp_srcptr numb, mp_size_t n)
大数比较函数(内联)
Definition lmmpn.h:1004
static mp_limb_t lmmp_add_1_(mp_ptr dst, mp_srcptr numa, mp_size_t na, mp_limb_t x)
大数加单精度数静态内联函数 [dst,na]=[numa,na]+x
Definition lmmpn.h:1111
void lmmp_sqr_(mp_ptr dst, mp_srcptr numa, mp_size_t na)
大数平方操作 [dst,2*na] = [numa,na]^2
Definition sqr.c:10
mp_limb_t lmmp_addshl1_n_(mp_ptr dst, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
加法结合左移1位操作 [dst,n] = [numa,n] + ([numb,n] << 1)
Definition shl.c:56
mp_limb_t lmmp_add_n_sub_n_(mp_ptr dsta, mp_ptr dstb, mp_srcptr numa, mp_srcptr numb, mp_size_t n)
同时执行n位加法和减法 ([dsta,n],[dstb,n]) = ([numa,n]+[numb,n],[numa,n]-[numb,n])
Definition add_n_sub_n.c:10
#define tp
#define ap2
#define v0
#define am1
#define ap1
#define v2
#define vm1
#define a2
#define a0
#define a1
#define vinf
#define v1
#define SALLOC_TYPE(n, type)
Definition tmp_alloc.h:87
#define TEMP_S_DECL
Definition tmp_alloc.h:76
#define TEMP_S_FREE
Definition tmp_alloc.h:105
void lmmp_toom_interp5_(mp_ptr dst, mp_ptr v2, mp_ptr vm1, mp_size_t n, mp_size_t spt, int vm1_neg, mp_limb_t vinf0)
Toom插值计算(5点插值),用于Toom-33和Toom-42乘法算法

引用了 a0, a1, a2, am1, ap1, ap2, lmmp_add_(), lmmp_add_1_(), lmmp_add_n_sub_n_(), lmmp_addshl1_n_(), lmmp_cmp_(), lmmp_param_assert, lmmp_sqr_(), lmmp_toom_interp5_(), SALLOC_TYPE, TEMP_S_DECL, TEMP_S_FREE, tp, v0, v1, v2, vinf , 以及 vm1.

+ 函数调用图: