michael@0: /* michael@0: * Copyright (c) 2010 The WebM project authors. All Rights Reserved. michael@0: * michael@0: * Use of this source code is governed by a BSD-style license michael@0: * that can be found in the LICENSE file in the root of the source michael@0: * tree. An additional intellectual property rights grant can be found michael@0: * in the file PATENTS. All contributing project authors may michael@0: * be found in the AUTHORS file in the root of the source tree. michael@0: */ michael@0: michael@0: michael@0: #include michael@0: #include michael@0: #include "vpx_config.h" michael@0: #include "vpx/vpx_integer.h" michael@0: michael@0: static unsigned int sad_mx_n_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int max_sad, int m, int n) michael@0: { michael@0: int r, c; michael@0: unsigned int sad = 0; michael@0: michael@0: for (r = 0; r < n; r++) michael@0: { michael@0: for (c = 0; c < m; c++) michael@0: { michael@0: sad += abs(src_ptr[c] - ref_ptr[c]); michael@0: } michael@0: michael@0: if (sad > max_sad) michael@0: break; michael@0: michael@0: src_ptr += src_stride; michael@0: ref_ptr += ref_stride; michael@0: } michael@0: michael@0: return sad; michael@0: } michael@0: michael@0: /* max_sad is provided as an optional optimization point. Alternative michael@0: * implementations of these functions are not required to check it. 
michael@0: */ michael@0: michael@0: unsigned int vp8_sad16x16_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int max_sad) michael@0: { michael@0: return sad_mx_n_c(src_ptr, src_stride, ref_ptr, ref_stride, max_sad, 16, 16); michael@0: } michael@0: michael@0: unsigned int vp8_sad8x8_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int max_sad) michael@0: { michael@0: return sad_mx_n_c(src_ptr, src_stride, ref_ptr, ref_stride, max_sad, 8, 8); michael@0: } michael@0: michael@0: unsigned int vp8_sad16x8_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int max_sad) michael@0: { michael@0: return sad_mx_n_c(src_ptr, src_stride, ref_ptr, ref_stride, max_sad, 16, 8); michael@0: michael@0: } michael@0: michael@0: unsigned int vp8_sad8x16_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int max_sad) michael@0: { michael@0: return sad_mx_n_c(src_ptr, src_stride, ref_ptr, ref_stride, max_sad, 8, 16); michael@0: } michael@0: michael@0: unsigned int vp8_sad4x4_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int max_sad) michael@0: { michael@0: return sad_mx_n_c(src_ptr, src_stride, ref_ptr, ref_stride, max_sad, 4, 4); michael@0: } michael@0: michael@0: void vp8_sad16x16x3_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int *sad_array) michael@0: { michael@0: sad_array[0] = vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, 
UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad16x16x8_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned short *sad_array) michael@0: { michael@0: sad_array[0] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: sad_array[3] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 3, ref_stride, UINT_MAX); michael@0: sad_array[4] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 4, ref_stride, UINT_MAX); michael@0: sad_array[5] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 5, ref_stride, UINT_MAX); michael@0: sad_array[6] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 6, ref_stride, UINT_MAX); michael@0: sad_array[7] = (unsigned short)vp8_sad16x16_c(src_ptr, src_stride, ref_ptr + 7, ref_stride, UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad16x8x3_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int *sad_array) michael@0: { michael@0: sad_array[0] = vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad16x8x8_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned short *sad_array) michael@0: { michael@0: sad_array[0] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = (unsigned 
short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: sad_array[3] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 3, ref_stride, UINT_MAX); michael@0: sad_array[4] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 4, ref_stride, UINT_MAX); michael@0: sad_array[5] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 5, ref_stride, UINT_MAX); michael@0: sad_array[6] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 6, ref_stride, UINT_MAX); michael@0: sad_array[7] = (unsigned short)vp8_sad16x8_c(src_ptr, src_stride, ref_ptr + 7, ref_stride, UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad8x8x3_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int *sad_array) michael@0: { michael@0: sad_array[0] = vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad8x8x8_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned short *sad_array) michael@0: { michael@0: sad_array[0] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: sad_array[3] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 3, ref_stride, UINT_MAX); michael@0: sad_array[4] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 4, 
ref_stride, UINT_MAX); michael@0: sad_array[5] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 5, ref_stride, UINT_MAX); michael@0: sad_array[6] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 6, ref_stride, UINT_MAX); michael@0: sad_array[7] = (unsigned short)vp8_sad8x8_c(src_ptr, src_stride, ref_ptr + 7, ref_stride, UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad8x16x3_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned int *sad_array) michael@0: { michael@0: sad_array[0] = vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: } michael@0: michael@0: void vp8_sad8x16x8_c(const unsigned char *src_ptr, int src_stride, michael@0: const unsigned char *ref_ptr, int ref_stride, michael@0: unsigned short *sad_array) michael@0: { michael@0: sad_array[0] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 0, ref_stride, UINT_MAX); michael@0: sad_array[1] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 1, ref_stride, UINT_MAX); michael@0: sad_array[2] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 2, ref_stride, UINT_MAX); michael@0: sad_array[3] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 3, ref_stride, UINT_MAX); michael@0: sad_array[4] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 4, ref_stride, UINT_MAX); michael@0: sad_array[5] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 5, ref_stride, UINT_MAX); michael@0: sad_array[6] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 6, ref_stride, UINT_MAX); michael@0: sad_array[7] = (unsigned short)vp8_sad8x16_c(src_ptr, src_stride, ref_ptr + 7, ref_stride, UINT_MAX); michael@0: } michael@0: 
/* Writes three 4x4 SADs into sad_array[0..2], for the reference positions
 * ref_ptr + 0, + 1 and + 2. UINT_MAX is passed as max_sad.
 */
void vp8_sad4x4x3_c(const unsigned char *src_ptr, int src_stride,
                    const unsigned char *ref_ptr, int ref_stride,
                    unsigned int *sad_array)
{
    int i;

    for (i = 0; i < 3; i++)
    {
        sad_array[i] = vp8_sad4x4_c(src_ptr, src_stride, ref_ptr + i, ref_stride, UINT_MAX);
    }
}

/* Writes eight 4x4 SADs into sad_array[0..7], for the reference positions
 * ref_ptr + 0 .. ref_ptr + 7. Each result is cast to unsigned short.
 */
void vp8_sad4x4x8_c(const unsigned char *src_ptr, int src_stride,
                    const unsigned char *ref_ptr, int ref_stride,
                    unsigned short *sad_array)
{
    int i;

    for (i = 0; i < 8; i++)
    {
        sad_array[i] = (unsigned short)vp8_sad4x4_c(src_ptr, src_stride, ref_ptr + i, ref_stride, UINT_MAX);
    }
}

/* The "x4d" variants take an array of four independent reference pointers
 * (ref_ptr[0..3]) that share a single ref_stride, and write the SAD of the
 * source block against each one into sad_array[0..3]. UINT_MAX is passed as
 * max_sad for every call.
 */

void vp8_sad16x16x4d_c(const unsigned char *src_ptr, int src_stride,
                       const unsigned char * const ref_ptr[], int ref_stride,
                       unsigned int *sad_array)
{
    int i;

    for (i = 0; i < 4; i++)
    {
        sad_array[i] = vp8_sad16x16_c(src_ptr, src_stride, ref_ptr[i], ref_stride, UINT_MAX);
    }
}

void vp8_sad16x8x4d_c(const unsigned char *src_ptr, int src_stride,
                      const unsigned char * const ref_ptr[], int ref_stride,
                      unsigned int *sad_array)
{
    int i;

    for (i = 0; i < 4; i++)
    {
        sad_array[i] = vp8_sad16x8_c(src_ptr, src_stride, ref_ptr[i], ref_stride, UINT_MAX);
    }
}

void vp8_sad8x8x4d_c(const unsigned char *src_ptr, int src_stride,
                     const unsigned char * const ref_ptr[], int ref_stride,
                     unsigned int *sad_array)
{
    int i;

    for (i = 0; i < 4; i++)
    {
        sad_array[i] = vp8_sad8x8_c(src_ptr, src_stride, ref_ptr[i], ref_stride, UINT_MAX);
    }
}

void vp8_sad8x16x4d_c(const unsigned char *src_ptr, int src_stride,
                      const unsigned char * const ref_ptr[], int ref_stride,
                      unsigned int *sad_array)
{
    int i;

    for (i = 0; i < 4; i++)
    {
        sad_array[i] = vp8_sad8x16_c(src_ptr, src_stride, ref_ptr[i], ref_stride, UINT_MAX);
    }
}

/* Writes the 4x4 SAD of the source block against each of the four reference
 * pointers ref_ptr[0..3] (sharing one ref_stride) into sad_array[0..3].
 * UINT_MAX is passed as max_sad for every call.
 */
void vp8_sad4x4x4d_c(const unsigned char *src_ptr, int src_stride,
                     const unsigned char * const ref_ptr[], int ref_stride,
                     unsigned int *sad_array)
{
    int i;

    for (i = 0; i < 4; i++)
    {
        sad_array[i] = vp8_sad4x4_c(src_ptr, src_stride, ref_ptr[i], ref_stride, UINT_MAX);
    }
}

/* Copy 2 macroblocks to a buffer */
/* Copies `height` rows of 32 bytes each from src_ptr to dst_ptr, advancing
 * the pointers by src_stride / dst_stride after every row.
 *
 * When CONFIG_FAST_UNALIGNED is zero or undefined each row is copied one
 * byte at a time; otherwise it is copied as eight 32-bit words.
 */
void vp8_copy32xn_c(unsigned char *src_ptr, int src_stride,
                    unsigned char *dst_ptr, int dst_stride,
                    int height)
{
    int r;

    for (r = 0; r < height; r++)
    {
        int i;

#if !(CONFIG_FAST_UNALIGNED)
        for (i = 0; i < 32; i++)
        {
            dst_ptr[i] = src_ptr[i];
        }
#else
        /* NOTE(review): word-sized access through a cast unsigned char
         * pointer; presumably relies on the target tolerating unaligned
         * 32-bit loads/stores, as the config macro name suggests - confirm.
         */
        for (i = 0; i < 8; i++)
        {
            ((uint32_t *)dst_ptr)[i] = ((uint32_t *)src_ptr)[i];
        }
#endif
        src_ptr += src_stride;
        dst_ptr += dst_stride;
    }
}