|  | /* | 
|  | *  Copyright (c) 2014 The WebM project authors. All Rights Reserved. | 
|  | * | 
|  | *  Use of this source code is governed by a BSD-style license | 
|  | *  that can be found in the LICENSE file in the root of the source | 
|  | *  tree. An additional intellectual property rights grant can be found | 
|  | *  in the file PATENTS.  All contributing project authors may | 
|  | *  be found in the AUTHORS file in the root of the source tree. | 
|  | */ | 
|  |  | 
|  | #include "./vpx_config.h" | 
|  | #include "./vpx_dsp_rtcd.h" | 
|  | #include "vpx_dsp/x86/convolve.h" | 
|  |  | 
|  | #if HAVE_SSE2 | 
// SSE2 "8" 1-D filter kernels.
// Each line declares one symbol of type filter8_1dfunction. Neither that type
// nor the kernel bodies are defined in this file (presumably the type comes
// from vpx_dsp/x86/convolve.h and the bodies live in assembly -- TODO confirm).
// Names follow vpx_filter_block1d<N>_<v|h>8[_avg]_sse2 with N in {16, 8, 4};
// presumably N is the block width, v/h the filter direction, 8 the tap count,
// and "_avg" a variant that averages into the destination -- verify against
// the kernel implementations.
// NOTE(review): every line of this file, including the ones below, is wrapped
// in `|  | ... | ` table-cell markup, which is not valid C. This looks like an
// extraction artifact -- confirm and strip it before building.
|  | filter8_1dfunction vpx_filter_block1d16_v8_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d16_h8_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_v8_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_h8_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_v8_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_h8_sse2; | 
// "_avg" counterparts of the six kernels above.
|  | filter8_1dfunction vpx_filter_block1d16_v8_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d16_h8_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_v8_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_h8_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_v8_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_h8_avg_sse2; | 
|  |  | 
// SSE2 "2" 1-D filter kernels.
// Same declaration pattern as the "8" kernels: one symbol of type
// filter8_1dfunction per line, with the type and the bodies defined outside
// this file. Names follow vpx_filter_block1d<N>_<v|h>2[_avg]_sse2 with N in
// {16, 8, 4}; presumably the "2" marks a 2-tap (bilinear) variant -- verify
// against the kernel implementations.
|  | filter8_1dfunction vpx_filter_block1d16_v2_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d16_h2_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_v2_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_h2_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_v2_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_h2_sse2; | 
// "_avg" counterparts of the six kernels above.
|  | filter8_1dfunction vpx_filter_block1d16_v2_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d16_h2_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_v2_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d8_h2_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_v2_avg_sse2; | 
|  | filter8_1dfunction vpx_filter_block1d4_h2_avg_sse2; | 
|  |  | 
// 1-D convolve entry points for SSE2, instantiated through FUN_CONV_1D (a
// macro defined outside this file). The commented prototypes below list the
// four functions these invocations are expected to produce, in the same
// order as the invocations.
// Argument pattern visible in the invocations:
//   (name suffix, step argument, filter argument, direction letter h/v,
//    source expression, "avg_" or empty, ISA suffix).
// Presumably the direction letter, the avg argument and the ISA suffix are
// token-pasted to pick the vpx_filter_block1d* kernels -- confirm against
// the macro definition.
|  | // void vpx_convolve8_horiz_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                               uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                               const int16_t *filter_x, int x_step_q4, | 
|  | //                               const int16_t *filter_y, int y_step_q4, | 
|  | //                               int w, int h); | 
|  | // void vpx_convolve8_vert_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                              uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                              const int16_t *filter_x, int x_step_q4, | 
|  | //                              const int16_t *filter_y, int y_step_q4, | 
|  | //                              int w, int h); | 
|  | // void vpx_convolve8_avg_horiz_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                                   uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                                   const int16_t *filter_x, int x_step_q4, | 
|  | //                                   const int16_t *filter_y, int y_step_q4, | 
|  | //                                   int w, int h); | 
|  | // void vpx_convolve8_avg_vert_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                                  uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                                  const int16_t *filter_x, int x_step_q4, | 
|  | //                                  const int16_t *filter_y, int y_step_q4, | 
|  | //                                  int w, int h); | 
// Horizontal variants pass `src` unchanged; vertical variants pass
// `src - src_stride * 3`, presumably so the filter window starts three rows
// above the current row -- confirm against the macro and the kernels.
|  | FUN_CONV_1D(horiz, x_step_q4, filter_x, h, src, , sse2); | 
|  | FUN_CONV_1D(vert, y_step_q4, filter_y, v, src - src_stride * 3, , sse2); | 
|  | FUN_CONV_1D(avg_horiz, x_step_q4, filter_x, h, src, avg_, sse2); | 
|  | FUN_CONV_1D(avg_vert, y_step_q4, filter_y, v, src - src_stride * 3, avg_, sse2); | 
|  |  | 
// 2-D convolve entry points for SSE2, instantiated through FUN_CONV_2D (a
// macro defined outside this file). The commented prototypes below list the
// two functions these invocations are expected to produce: the plain variant
// (empty first argument) and the "avg_" variant.
// How the 2-D functions are built (e.g. from the 1-D entry points) is decided
// by the macro body, which is not visible here.
|  | // void vpx_convolve8_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                         uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                         const int16_t *filter_x, int x_step_q4, | 
|  | //                         const int16_t *filter_y, int y_step_q4, | 
|  | //                         int w, int h); | 
|  | // void vpx_convolve8_avg_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                             uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                             const int16_t *filter_x, int x_step_q4, | 
|  | //                             const int16_t *filter_y, int y_step_q4, | 
|  | //                             int w, int h); | 
|  | FUN_CONV_2D(, sse2); | 
|  | FUN_CONV_2D(avg_ , sse2); | 
|  |  | 
|  | #if CONFIG_VP9_HIGHBITDEPTH && ARCH_X86_64 | 
// High-bitdepth SSE2 "8" 1-D filter kernels.
// Only compiled when CONFIG_VP9_HIGHBITDEPTH && ARCH_X86_64 holds (see the
// enclosing #if). Each line declares one symbol of type
// highbd_filter8_1dfunction; the type and the kernel bodies are defined
// outside this file.
// Names follow vpx_highbd_filter_block1d<N>_<v|h>8[_avg]_sse2 with N in
// {16, 8, 4}; presumably N is the block width, v/h the filter direction and
// 8 the tap count -- verify against the kernel implementations.
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_v8_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_h8_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_v8_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_h8_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_v8_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_h8_sse2; | 
// "_avg" counterparts of the six kernels above.
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_v8_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_h8_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_v8_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_h8_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_v8_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_h8_avg_sse2; | 
|  |  | 
// High-bitdepth SSE2 "2" 1-D filter kernels.
// Same declaration pattern as the high-bitdepth "8" kernels: one symbol of
// type highbd_filter8_1dfunction per line, with the type and the bodies
// defined outside this file. Names follow
// vpx_highbd_filter_block1d<N>_<v|h>2[_avg]_sse2 with N in {16, 8, 4};
// presumably the "2" marks a 2-tap (bilinear) variant -- verify against the
// kernel implementations.
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_v2_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_h2_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_v2_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_h2_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_v2_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_h2_sse2; | 
// "_avg" counterparts of the six kernels above.
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_v2_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d16_h2_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_v2_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d8_h2_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_v2_avg_sse2; | 
|  | highbd_filter8_1dfunction vpx_highbd_filter_block1d4_h2_avg_sse2; | 
|  |  | 
// High-bitdepth 1-D convolve entry points for SSE2, instantiated through
// HIGH_FUN_CONV_1D (a macro defined outside this file). The commented
// prototypes below list the four functions these invocations are expected to
// produce; compared with the non-highbd prototypes they take a trailing
// `int bd` parameter.
// The invocations use the same argument pattern as the FUN_CONV_1D ones:
//   (name suffix, step argument, filter argument, direction letter h/v,
//    source expression, "avg_" or empty, ISA suffix).
|  | // void vpx_highbd_convolve8_horiz_sse2(const uint8_t *src, | 
|  | //                                      ptrdiff_t src_stride, | 
|  | //                                      uint8_t *dst, | 
|  | //                                      ptrdiff_t dst_stride, | 
|  | //                                      const int16_t *filter_x, | 
|  | //                                      int x_step_q4, | 
|  | //                                      const int16_t *filter_y, | 
|  | //                                      int y_step_q4, | 
|  | //                                      int w, int h, int bd); | 
|  | // void vpx_highbd_convolve8_vert_sse2(const uint8_t *src, | 
|  | //                                     ptrdiff_t src_stride, | 
|  | //                                     uint8_t *dst, | 
|  | //                                     ptrdiff_t dst_stride, | 
|  | //                                     const int16_t *filter_x, | 
|  | //                                     int x_step_q4, | 
|  | //                                     const int16_t *filter_y, | 
|  | //                                     int y_step_q4, | 
|  | //                                     int w, int h, int bd); | 
|  | // void vpx_highbd_convolve8_avg_horiz_sse2(const uint8_t *src, | 
|  | //                                          ptrdiff_t src_stride, | 
|  | //                                          uint8_t *dst, | 
|  | //                                          ptrdiff_t dst_stride, | 
|  | //                                          const int16_t *filter_x, | 
|  | //                                          int x_step_q4, | 
|  | //                                          const int16_t *filter_y, | 
|  | //                                          int y_step_q4, | 
|  | //                                          int w, int h, int bd); | 
|  | // void vpx_highbd_convolve8_avg_vert_sse2(const uint8_t *src, | 
|  | //                                         ptrdiff_t src_stride, | 
|  | //                                         uint8_t *dst, | 
|  | //                                         ptrdiff_t dst_stride, | 
|  | //                                         const int16_t *filter_x, | 
|  | //                                         int x_step_q4, | 
|  | //                                         const int16_t *filter_y, | 
|  | //                                         int y_step_q4, | 
|  | //                                         int w, int h, int bd); | 
// Horizontal variants pass `src` unchanged; vertical variants pass
// `src - src_stride * 3`, presumably so the filter window starts three rows
// above the current row -- confirm against the macro and the kernels.
|  | HIGH_FUN_CONV_1D(horiz, x_step_q4, filter_x, h, src, , sse2); | 
|  | HIGH_FUN_CONV_1D(vert, y_step_q4, filter_y, v, src - src_stride * 3, , sse2); | 
|  | HIGH_FUN_CONV_1D(avg_horiz, x_step_q4, filter_x, h, src, avg_, sse2); | 
|  | HIGH_FUN_CONV_1D(avg_vert, y_step_q4, filter_y, v, src - src_stride * 3, avg_, | 
|  | sse2); | 
|  |  | 
// High-bitdepth 2-D convolve entry points for SSE2, instantiated through
// HIGH_FUN_CONV_2D (a macro defined outside this file). The commented
// prototypes below list the two functions these invocations are expected to
// produce: the plain variant (empty first argument) and the "avg_" variant,
// each taking a trailing `int bd` parameter.
// How the 2-D functions are built is decided by the macro body, which is not
// visible here.
|  | // void vpx_highbd_convolve8_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                                uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                                const int16_t *filter_x, int x_step_q4, | 
|  | //                                const int16_t *filter_y, int y_step_q4, | 
|  | //                                int w, int h, int bd); | 
|  | // void vpx_highbd_convolve8_avg_sse2(const uint8_t *src, ptrdiff_t src_stride, | 
|  | //                                    uint8_t *dst, ptrdiff_t dst_stride, | 
|  | //                                    const int16_t *filter_x, int x_step_q4, | 
|  | //                                    const int16_t *filter_y, int y_step_q4, | 
|  | //                                    int w, int h, int bd); | 
|  | HIGH_FUN_CONV_2D(, sse2); | 
|  | HIGH_FUN_CONV_2D(avg_ , sse2); | 
|  | #endif  // CONFIG_VP9_HIGHBITDEPTH && ARCH_X86_64 | 
|  | #endif  // HAVE_SSE2 |