Lines Matching +full:2 +full:d

12 	ld1	{v17.2d},[x1]		//load input H
14 shl v19.2d,v19.2d,#57 //0xc2.0
16 ushr v18.2d,v19.2d,#63
19 ushr v18.2d,v3.2d,#63
22 shl v3.2d,v3.2d,#1
27 st1 {v20.2d},[x0],#16 //store Htable[0]
29 //calculate H^2
31 pmull v0.1q,v20.1d,v20.1d
33 pmull2 v2.1q,v20.2d,v20.2d
34 pmull v1.1q,v16.1d,v16.1d
40 pmull v18.1q,v0.1d,v19.1d //1st phase
42 ins v2.d[0],v1.d[1]
43 ins v1.d[1],v0.d[0]
46 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase
47 pmull v0.1q,v0.1d,v19.1d
54 st1 {v21.2d,v22.2d},[x0],#32 //store Htable[1..2]
56 pmull v0.1q,v20.1d, v22.1d
57 pmull v5.1q,v22.1d,v22.1d
58 pmull2 v2.1q,v20.2d, v22.2d
59 pmull2 v7.1q,v22.2d,v22.2d
60 pmull v1.1q,v16.1d,v17.1d
61 pmull v6.1q,v17.1d,v17.1d
70 pmull v18.1q,v0.1d,v19.1d //1st phase
72 pmull v4.1q,v5.1d,v19.1d
74 ins v2.d[0],v1.d[1]
75 ins v7.d[0],v6.d[1]
76 ins v1.d[1],v0.d[0]
77 ins v6.d[1],v5.d[0]
81 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase
83 pmull v0.1q,v0.1d,v19.1d
84 pmull v5.1q,v5.1d,v19.1d
95 st1 {v20.2d,v21.2d,v22.2d},[x0] //store Htable[3..5]
103 ld1 {v17.2d},[x0] //load Xi
105 ld1 {v20.2d,v21.2d},[x1] //load twisted H, ...
106 shl v19.2d,v19.2d,#57
112 pmull v0.1q,v20.1d,v3.1d //H.lo·Xi.lo
114 pmull2 v2.1q,v20.2d,v3.2d //H.hi·Xi.hi
115 pmull v1.1q,v21.1d,v17.1d //(H.lo+H.hi)·(Xi.lo+Xi.hi)
121 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
123 ins v2.d[0],v1.d[1]
124 ins v1.d[1],v0.d[0]
127 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
128 pmull v0.1q,v0.1d,v19.1d
136 st1 {v0.2d},[x0] //write out Xi
147 ld1 {v0.2d},[x0] //load [rotated] Xi
163 ld1 {v20.2d,v21.2d},[x1],#32 //load twisted H, ..., H^2
165 ld1 {v22.2d},[x1]
168 ld1 {v16.2d},[x2],#16 //load [rotated] I[0]
169 shl v19.2d,v19.2d,#57 //compose 0xc2.0 constant
176 ld1 {v17.2d},[x2],x12 //load [rotated] I[1]
182 pmull v4.1q,v20.1d,v7.1d //H·Ii+1
184 pmull2 v6.1q,v20.2d,v7.2d
191 pmull v0.1q,v22.1d,v3.1d //H^2.lo·Xi.lo
194 pmull v5.1q,v21.1d,v17.1d
196 pmull2 v2.1q,v22.2d,v3.2d //H^2.hi·Xi.hi
198 pmull2 v1.1q,v21.2d,v18.2d //(H^2.lo+H^2.hi)·(Xi.lo+Xi.hi)
199 ld1 {v16.2d},[x2],x12 //load [rotated] I[i+2]
208 ld1 {v17.2d},[x2],x12 //load [rotated] I[i+3]
213 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
218 ins v2.d[0],v1.d[1]
219 ins v1.d[1],v0.d[0]
223 pmull v4.1q,v20.1d,v7.1d //H·Ii+1
226 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
227 pmull v0.1q,v0.1d,v19.1d
231 pmull2 v6.1q,v20.2d,v7.2d
244 pmull v0.1q,v20.1d,v3.1d //H.lo·Xi.lo
246 pmull2 v2.1q,v20.2d,v3.2d //H.hi·Xi.hi
247 pmull v1.1q,v21.1d,v17.1d //(H.lo+H.hi)·(Xi.lo+Xi.hi)
253 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
255 ins v2.d[0],v1.d[1]
256 ins v1.d[1],v0.d[0]
259 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
260 pmull v0.1q,v0.1d,v19.1d
269 st1 {v0.2d},[x0] //write out Xi
277 ld1 {v0.2d},[x0] //load [rotated] Xi
278 ld1 {v20.2d,v21.2d,v22.2d},[x1],#48 //load twisted H, ..., H^2
280 ld1 {v26.2d,v27.2d,v28.2d},[x1] //load twisted H^3, ..., H^4
281 shl v19.2d,v19.2d,#57 //compose 0xc2.0 constant
283 ld1 {v4.2d,v5.2d,v6.2d,v7.2d},[x2],#64
295 pmull v29.1q,v20.1d,v25.1d //H·Ii+3
297 pmull2 v31.1q,v20.2d,v25.2d
298 pmull v30.1q,v21.1d,v7.1d
300 pmull v16.1q,v22.1d,v24.1d //H^2·Ii+2
302 pmull2 v24.1q,v22.2d,v24.2d
303 pmull2 v6.1q,v21.2d,v6.2d
309 pmull v7.1q,v26.1d,v23.1d //H^3·Ii+1
311 pmull2 v23.1q,v26.2d,v23.2d
312 pmull v5.1q,v27.1d,v5.1d
326 ld1 {v4.2d,v5.2d,v6.2d,v7.2d},[x2],#64
335 pmull v0.1q,v28.1d,v3.1d //H^4·(Xi+Ii)
337 pmull2 v2.1q,v28.2d,v3.2d
339 pmull2 v1.1q,v27.2d,v16.2d
349 pmull v29.1q,v20.1d,v25.1d //H·Ii+3
352 pmull2 v31.1q,v20.2d,v25.2d
354 pmull v30.1q,v21.1d,v7.1d
356 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
357 ins v2.d[0],v1.d[1]
358 ins v1.d[1],v0.d[0]
359 pmull v16.1q,v22.1d,v24.1d //H^2·Ii+2
361 pmull2 v24.1q,v22.2d,v24.2d
363 pmull2 v6.1q,v21.2d,v6.2d
369 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
370 pmull v0.1q,v0.1d,v19.1d
371 pmull v7.1q,v26.1d,v23.1d //H^3·Ii+1
374 pmull2 v23.1q,v26.2d,v23.2d
375 pmull v5.1q,v27.1d,v5.1d
390 pmull v0.1q,v28.1d,v3.1d //H^4·(Xi+Ii)
392 pmull2 v2.1q,v28.2d,v3.2d
393 pmull2 v1.1q,v27.2d,v16.2d
409 ld1 {v4.2d,v5.2d,v6.2d},[x2]
417 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
418 ins v2.d[0],v1.d[1]
419 ins v1.d[1],v0.d[0]
424 pmull v29.1q,v20.1d,v24.1d //H·Ii+2
427 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
428 pmull v0.1q,v0.1d,v19.1d
430 pmull2 v31.1q,v20.2d,v24.2d
431 pmull v30.1q,v21.1d,v6.1d
433 pmull v7.1q,v22.1d,v23.1d //H^2·Ii+1
437 pmull2 v23.1q,v22.2d,v23.2d
439 pmull2 v5.1q,v21.2d,v5.2d
446 pmull v0.1q,v26.1d,v3.1d //H^3·(Xi+Ii)
448 pmull2 v2.1q,v26.2d,v3.2d
449 pmull v1.1q,v27.1d,v16.1d
461 ld1 {v4.2d,v5.2d},[x2]
468 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
469 ins v2.d[0],v1.d[1]
470 ins v1.d[1],v0.d[0]
474 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
475 pmull v0.1q,v0.1d,v19.1d
480 pmull v29.1q,v20.1d,v23.1d //H·Ii+1
486 pmull2 v31.1q,v20.2d,v23.2d
487 pmull v30.1q,v21.1d,v5.1d
489 pmull v0.1q,v22.1d,v3.1d //H^2·(Xi+Ii)
491 pmull2 v2.1q,v22.2d,v3.2d
492 pmull2 v1.1q,v21.2d,v16.2d
504 ld1 {v4.2d},[x2]
510 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
511 ins v2.d[0],v1.d[1]
512 ins v1.d[1],v0.d[0]
515 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
516 pmull v0.1q,v0.1d,v19.1d
524 pmull v0.1q,v20.1d,v3.1d
526 pmull2 v2.1q,v20.2d,v3.2d
527 pmull v1.1q,v21.1d,v16.1d
535 pmull v18.1q,v0.1d,v19.1d //1st phase of reduction
536 ins v2.d[0],v1.d[1]
537 ins v1.d[1],v0.d[0]
540 ext v18.16b,v0.16b,v0.16b,#8 //2nd phase of reduction
541 pmull v0.1q,v0.1d,v19.1d
549 st1 {v0.2d},[x0] //write out Xi
554 .align 2
555 .align 2