- FOR_LIMB(j, 0, 8, {
- accum2 = 0;
- FOR_LIMB(i, 0, j + 1, {
- accum2 += widemul(a[j - i], b[i]);
- accum1 += widemul(aa[j - i], bb[i]);
- accum0 += widemul(a[8 + j - i], b[8 + i]);
- }
- ); accum1 -= accum2; accum0 += accum2;
- accum2 = 0;
- FOR_LIMB(i, j + 1, 8, {
- accum0 -=
- widemul(a[8 + j - i], b[i]);
- accum2 +=
- widemul(aa[8 + j - i],
- bb[i]);
- accum1 += widemul(a[16 + j - i], b[8 + i]);
- }
- );
- accum1 += accum2;
- accum0 += accum2;
- c[j] = ((uint32_t)(accum0)) & mask;
- c[j + 8] = ((uint32_t)(accum1)) & mask;
- accum0 >>= 28; accum1 >>= 28;
- });
+ for (j = 0; j < 8; j++) {
+ accum2 = 0;
+ for (i = 0; i < j + 1; i++) {
+ accum2 += widemul(a[j - i], b[i]);
+ accum1 += widemul(aa[j - i], bb[i]);
+ accum0 += widemul(a[8 + j - i], b[8 + i]);
+ }
+ accum1 -= accum2;
+ accum0 += accum2;
+ accum2 = 0;
+ for (i = j + 1; i < 8; i++) {
+ accum0 -= widemul(a[8 + j - i], b[i]);
+ accum2 += widemul(aa[8 + j - i], bb[i]);
+ accum1 += widemul(a[16 + j - i], b[8 + i]);
+ }
+ accum1 += accum2;
+ accum0 += accum2;
+ c[j] = ((uint32_t)(accum0)) & mask;
+ c[j + 8] = ((uint32_t)(accum1)) & mask;
+ accum0 >>= 28;
+ accum1 >>= 28;
+ }