ref: dd33c656daf8dc2658dfe7a435ff4bc65a4474eb
parent: d9892e846f893b3547d223b2de230b52d5b9462d
parent: 5c22224e9e43befc414cce2cf163616c9d56b0d3
author: Debargha Mukherjee <debargha@google.com>
date: Thu Dec 11 07:28:45 EST 2014
Merge "Corrected optimization of 8x8 DCT code"
--- a/vp9/common/x86/vp9_idct_intrin_sse2.c
+++ b/vp9/common/x86/vp9_idct_intrin_sse2.c
@@ -4260,7 +4260,7 @@
// N.B. Only first 4 cols contain non-zero coeffs
max_input = _mm_max_epi16(inptr[0], inptr[1]);
min_input = _mm_min_epi16(inptr[0], inptr[1]);
- for (i = 2; i < 4; i++) {
+ for (i = 2; i < 8; i++) {
max_input = _mm_max_epi16(max_input, inptr[i]);
min_input = _mm_min_epi16(min_input, inptr[i]);
}
--
⑨