Fixes color issue when scaling without breaking mingw. BUG=https://bugs.chromium.org/p/libyuv/issues/detail?id=605 BUG=https://bugs.chromium.org/p/webm/issues/detail?id=1252 Change-Id: I09437d93fd65964ad57113274d8c819f3eaf2e57
		
			
				
	
	
		
			65 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			65 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/*
 | 
						|
 *  Copyright 2012 The LibYuv Project Authors. All rights reserved.
 | 
						|
 *
 | 
						|
 *  Use of this source code is governed by a BSD-style license
 | 
						|
 *  that can be found in the LICENSE file in the root of the source
 | 
						|
 *  tree. An additional intellectual property rights grant can be found
 | 
						|
 *  in the file PATENTS. All contributing project authors may
 | 
						|
 *  be found in the AUTHORS file in the root of the source tree.
 | 
						|
 */
 | 
						|
 | 
						|
#include "libyuv/basic_types.h"
 | 
						|
 | 
						|
#include "libyuv/compare_row.h"
 | 
						|
#include "libyuv/row.h"
 | 
						|
 | 
						|
#ifdef __cplusplus
 | 
						|
namespace libyuv {
 | 
						|
extern "C" {
 | 
						|
#endif
 | 
						|
 | 
						|
#if !defined(LIBYUV_DISABLE_NEON) && defined(__aarch64__)
 | 
						|
 | 
						|
uint32 SumSquareError_NEON(const uint8* src_a, const uint8* src_b, int count) {
 | 
						|
  volatile uint32 sse;
 | 
						|
  asm volatile (
 | 
						|
    "eor        v16.16b, v16.16b, v16.16b      \n"
 | 
						|
    "eor        v18.16b, v18.16b, v18.16b      \n"
 | 
						|
    "eor        v17.16b, v17.16b, v17.16b      \n"
 | 
						|
    "eor        v19.16b, v19.16b, v19.16b      \n"
 | 
						|
 | 
						|
  "1:                                          \n"
 | 
						|
    MEMACCESS(0)
 | 
						|
    "ld1        {v0.16b}, [%0], #16            \n"
 | 
						|
    MEMACCESS(1)
 | 
						|
    "ld1        {v1.16b}, [%1], #16            \n"
 | 
						|
    "subs       %w2, %w2, #16                  \n"
 | 
						|
    "usubl      v2.8h, v0.8b, v1.8b            \n"
 | 
						|
    "usubl2     v3.8h, v0.16b, v1.16b          \n"
 | 
						|
    "smlal      v16.4s, v2.4h, v2.4h           \n"
 | 
						|
    "smlal      v17.4s, v3.4h, v3.4h           \n"
 | 
						|
    "smlal2     v18.4s, v2.8h, v2.8h           \n"
 | 
						|
    "smlal2     v19.4s, v3.8h, v3.8h           \n"
 | 
						|
    "b.gt       1b                             \n"
 | 
						|
 | 
						|
    "add        v16.4s, v16.4s, v17.4s         \n"
 | 
						|
    "add        v18.4s, v18.4s, v19.4s         \n"
 | 
						|
    "add        v19.4s, v16.4s, v18.4s         \n"
 | 
						|
    "addv       s0, v19.4s                     \n"
 | 
						|
    "fmov       %w3, s0                        \n"
 | 
						|
    : "+r"(src_a),
 | 
						|
      "+r"(src_b),
 | 
						|
      "+r"(count),
 | 
						|
      "=r"(sse)
 | 
						|
    :
 | 
						|
    : "cc", "v0", "v1", "v2", "v3", "v16", "v17", "v18", "v19");
 | 
						|
  return sse;
 | 
						|
}
 | 
						|
 | 
						|
#endif  // !defined(LIBYUV_DISABLE_NEON) && defined(__aarch64__)
 | 
						|
 | 
						|
#ifdef __cplusplus
 | 
						|
}  // extern "C"
 | 
						|
}  // namespace libyuv
 | 
						|
#endif
 |