shithub: libvpx

Download patch

ref: f6c6f37e0cf6b09d9ce753870f8d4644e8fb557e
parent: 6624f20785bb782ad02edc27a60403946c11ff29
parent: 8334a48d3ac0c567f662b90cf4e66aeee88cf68a
author: Scott LaVarnway <[email protected]>
date: Thu Aug 3 19:17:09 EDT 2017

Merge "vpx_dsp: Use correct check for halfpel in"

--- a/vpx_dsp/x86/variance_impl_avx2.c
+++ b/vpx_dsp/x86/variance_impl_avx2.c
@@ -305,7 +305,7 @@
   }
 }
 
-// (x == 0, y == 8) or (x == 8, y == 0).  sstep determines the direction.
+// (x == 0, y == 4) or (x == 4, y == 0).  sstep determines the direction.
 static INLINE void spv32_half_zero(const uint8_t *src, int src_stride,
                                    const uint8_t *dst, int dst_stride,
                                    const uint8_t *sec, int sec_stride,
@@ -335,7 +335,7 @@
   }
 }
 
-static INLINE void spv32_x0_y8(const uint8_t *src, int src_stride,
+static INLINE void spv32_x0_y4(const uint8_t *src, int src_stride,
                                const uint8_t *dst, int dst_stride,
                                const uint8_t *sec, int sec_stride, int do_sec,
                                int height, __m256i *sum_reg, __m256i *sse_reg) {
@@ -343,7 +343,7 @@
                   height, sum_reg, sse_reg, src_stride);
 }
 
-static INLINE void spv32_x8_y0(const uint8_t *src, int src_stride,
+static INLINE void spv32_x4_y0(const uint8_t *src, int src_stride,
                                const uint8_t *dst, int dst_stride,
                                const uint8_t *sec, int sec_stride, int do_sec,
                                int height, __m256i *sum_reg, __m256i *sse_reg) {
@@ -351,7 +351,7 @@
                   height, sum_reg, sse_reg, 1);
 }
 
-static INLINE void spv32_x8_y8(const uint8_t *src, int src_stride,
+static INLINE void spv32_x4_y4(const uint8_t *src, int src_stride,
                                const uint8_t *dst, int dst_stride,
                                const uint8_t *sec, int sec_stride, int do_sec,
                                int height, __m256i *sum_reg, __m256i *sse_reg) {
@@ -387,7 +387,7 @@
   }
 }
 
-// (x == 0, y == bil) or (x == 8, y == bil).  sstep determines the direction.
+// (x == 0, y == bil) or (x == 4, y == bil).  sstep determines the direction.
 static INLINE void spv32_bilin_zero(const uint8_t *src, int src_stride,
                                     const uint8_t *dst, int dst_stride,
                                     const uint8_t *sec, int sec_stride,
@@ -439,7 +439,7 @@
                    height, sum_reg, sse_reg, x_offset, 1);
 }
 
-static INLINE void spv32_x8_yb(const uint8_t *src, int src_stride,
+static INLINE void spv32_x4_yb(const uint8_t *src, int src_stride,
                                const uint8_t *dst, int dst_stride,
                                const uint8_t *sec, int sec_stride, int do_sec,
                                int height, __m256i *sum_reg, __m256i *sse_reg,
@@ -478,7 +478,7 @@
   }
 }
 
-static INLINE void spv32_xb_y8(const uint8_t *src, int src_stride,
+static INLINE void spv32_xb_y4(const uint8_t *src, int src_stride,
                                const uint8_t *dst, int dst_stride,
                                const uint8_t *sec, int sec_stride, int do_sec,
                                int height, __m256i *sum_reg, __m256i *sse_reg,
@@ -599,9 +599,9 @@
     if (y_offset == 0) {
       spv32_x0_y0(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg);
-      // x_offset = 0 and y_offset = 8
-    } else if (y_offset == 8) {
-      spv32_x0_y8(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
+      // x_offset = 0 and y_offset = 4
+    } else if (y_offset == 4) {
+      spv32_x0_y4(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg);
       // x_offset = 0 and y_offset = bilin interpolation
     } else {
@@ -608,18 +608,18 @@
       spv32_x0_yb(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg, y_offset);
     }
-    // x_offset = 8  and y_offset = 0
-  } else if (x_offset == 8) {
+    // x_offset = 4  and y_offset = 0
+  } else if (x_offset == 4) {
     if (y_offset == 0) {
-      spv32_x8_y0(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
+      spv32_x4_y0(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg);
-      // x_offset = 8  and y_offset = 8
-    } else if (y_offset == 8) {
-      spv32_x8_y8(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
+      // x_offset = 4  and y_offset = 4
+    } else if (y_offset == 4) {
+      spv32_x4_y4(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg);
-      // x_offset = 8  and y_offset = bilin interpolation
+      // x_offset = 4  and y_offset = bilin interpolation
     } else {
-      spv32_x8_yb(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
+      spv32_x4_yb(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg, y_offset);
     }
     // x_offset = bilin interpolation and y_offset = 0
@@ -627,9 +627,9 @@
     if (y_offset == 0) {
       spv32_xb_y0(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg, x_offset);
-      // x_offset = bilin interpolation and y_offset = 8
-    } else if (y_offset == 8) {
-      spv32_xb_y8(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
+      // x_offset = bilin interpolation and y_offset = 4
+    } else if (y_offset == 4) {
+      spv32_xb_y4(src, src_stride, dst, dst_stride, sec, sec_stride, do_sec,
                   height, &sum_reg, &sse_reg, x_offset);
       // x_offset = bilin interpolation and y_offset = bilin interpolation
     } else {