shithub: libvpx

Download patch

ref: b2120948391f8beb7ff74bd46b83da1ff2020f49
parent: 48178d2cf284a7cdc4cb7973dab190e386de5af1
parent: 23d1c06268e884ee65d3d67943c62c26a7e369b7
author: Scott LaVarnway <[email protected]>
date: Tue Oct 6 07:35:15 EDT 2015

Merge "VPX: refactor vpx_idct32x32_1_add_sse2()"

--- a/vpx_dsp/x86/inv_txfm_sse2.c
+++ b/vpx_dsp/x86/inv_txfm_sse2.c
@@ -3474,7 +3474,7 @@
                               int stride) {
   __m128i dc_value;
   const __m128i zero = _mm_setzero_si128();
-  int a, i;
+  int a, j;
 
   a = dct_const_round_shift(input[0] * cospi_16_64);
   a = dct_const_round_shift(a * cospi_16_64);
@@ -3482,12 +3482,11 @@
 
   dc_value = _mm_set1_epi16(a);
 
-  for (i = 0; i < 4; ++i) {
-    int j;
-    for (j = 0; j < 32; ++j) {
-      RECON_AND_STORE(dest + j * stride, dc_value);
-    }
-    dest += 8;
+  for (j = 0; j < 32; ++j) {
+    RECON_AND_STORE(dest +  0 + j * stride, dc_value);
+    RECON_AND_STORE(dest +  8 + j * stride, dc_value);
+    RECON_AND_STORE(dest + 16 + j * stride, dc_value);
+    RECON_AND_STORE(dest + 24 + j * stride, dc_value);
   }
 }