b1 = (tmp[i + 0] - tmp[i + 8]) * 23170;
c1 = tmp[i + 4] * 12540 - tmp[i + 12] * 30274;
d1 = tmp[i + 4] * 30274 + tmp[i + 12] * 12540;
- dc[i*4+0] = 0;
- dc[i*4+1] = 0;
- dc[i*4+2] = 0;
- dc[i*4+3] = 0;
+ AV_ZERO64(dc + i*4);
block[0][i][0] = (a1 + d1 + 0x20000) >> 18;
block[3][i][0] = (a1 - d1 + 0x20000) >> 18;
block[1][i][0] = (b1 + c1 + 0x20000) >> 18;
b1 = (block[i*4+0] - block[i*4+2]) * 23170;
c1 = block[i*4+1] * 12540 - block[i*4+3] * 30274;
d1 = block[i*4+1] * 30274 + block[i*4+3] * 12540;
- block[i*4+0] = 0;
- block[i*4+1] = 0;
- block[i*4+2] = 0;
- block[i*4+3] = 0;
+ AV_ZERO64(block + i*4);
tmp[i*4+0] = (a1 + d1) >> 14;
tmp[i*4+3] = (a1 - d1) >> 14;
tmp[i*4+1] = (b1 + c1) >> 14;
t1 = dc[i*4+1] + dc[i*4+2];
t2 = dc[i*4+1] - dc[i*4+2];
t3 = dc[i*4+0] - dc[i*4+3] + 3; // rounding
- dc[i*4+0] = 0;
- dc[i*4+1] = 0;
- dc[i*4+2] = 0;
- dc[i*4+3] = 0;
+ AV_ZERO64(dc + i*4);
block[i][0][0] = (t0 + t1) >> 3;
block[i][1][0] = (t3 + t2) >> 3;