/* * Copyright 2011 The LibYuv Project Authors. All rights reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree.
*/
static uint32_t ARGBDetectRow_C(const uint8_t* argb, int width) { int x; for (x = 0; x < width - 1; x += 2) { if (argb[0] != 255) { // First byte is not Alpha of 255, so not ARGB. return FOURCC_BGRA;
} if (argb[3] != 255) { // Fourth byte is not Alpha of 255, so not BGRA. return FOURCC_ARGB;
} if (argb[4] != 255) { // Second pixel first byte is not Alpha of 255. return FOURCC_BGRA;
} if (argb[7] != 255) { // Second pixel fourth byte is not Alpha of 255. return FOURCC_ARGB;
}
argb += 8;
} if (width & 1) { if (argb[0] != 255) { // First byte is not Alpha of 255, so not ARGB. return FOURCC_BGRA;
} if (argb[3] != 255) { // 4th byte is not Alpha of 255, so not BGRA. return FOURCC_ARGB;
}
} return 0;
}
// Scan an opaque argb image and return fourcc based on alpha offset. // Returns FOURCC_ARGB, FOURCC_BGRA, or 0 if unknown.
LIBYUV_API
uint32_t ARGBDetect(const uint8_t* argb, int stride_argb, int width, int height) {
uint32_t fourcc = 0; int h;
// NEON version accumulates in 16 bit shorts which overflow at 65536 bytes. // So actual maximum is 1 less loop, which is 64436 - 32 bytes.
LIBYUV_API
uint64_t ComputeHammingDistance(const uint8_t* src_a, const uint8_t* src_b, int count) { constint kBlockSize = 1 << 15; // 32768; constint kSimdSize = 64; // SIMD for multiple of 64, and C for remainder int remainder = count & (kBlockSize - 1) & ~(kSimdSize - 1);
uint64_t diff = 0; int i;
uint32_t (*HammingDistance)(const uint8_t* src_a, const uint8_t* src_b, int count) = HammingDistance_C; #ifdefined(HAS_HAMMINGDISTANCE_NEON) if (TestCpuFlag(kCpuHasNEON)) {
HammingDistance = HammingDistance_NEON;
} #endif #ifdefined(HAS_HAMMINGDISTANCE_SSSE3) if (TestCpuFlag(kCpuHasSSSE3)) {
HammingDistance = HammingDistance_SSSE3;
} #endif #ifdefined(HAS_HAMMINGDISTANCE_SSE42) if (TestCpuFlag(kCpuHasSSE42)) {
HammingDistance = HammingDistance_SSE42;
} #endif #ifdefined(HAS_HAMMINGDISTANCE_AVX2) if (TestCpuFlag(kCpuHasAVX2)) {
HammingDistance = HammingDistance_AVX2;
} #endif #ifdefined(HAS_HAMMINGDISTANCE_MMI) if (TestCpuFlag(kCpuHasMMI)) {
HammingDistance = HammingDistance_MMI;
} #endif #ifdefined(HAS_HAMMINGDISTANCE_MSA) if (TestCpuFlag(kCpuHasMSA)) {
HammingDistance = HammingDistance_MSA;
} #endif
#ifdef _OPENMP #pragma omp parallel for reduction(+ : diff) #endif for (i = 0; i < (count - (kBlockSize - 1)); i += kBlockSize) {
diff += HammingDistance(src_a + i, src_b + i, kBlockSize);
}
src_a += count & ~(kBlockSize - 1);
src_b += count & ~(kBlockSize - 1); if (remainder) {
diff += HammingDistance(src_a, src_b, remainder);
src_a += remainder;
src_b += remainder;
}
remainder = count & (kSimdSize - 1); if (remainder) {
diff += HammingDistance_C(src_a, src_b, remainder);
} return diff;
}
// TODO(fbarchard): Refactor into row function.
LIBYUV_API
uint64_t ComputeSumSquareError(const uint8_t* src_a, const uint8_t* src_b, int count) { // SumSquareError returns values 0 to 65535 for each squared difference. // Up to 65536 of those can be summed and remain within a uint32_t. // After each block of 65536 pixels, accumulate into a uint64_t. constint kBlockSize = 65536; int remainder = count & (kBlockSize - 1) & ~31;
uint64_t sse = 0; int i;
uint32_t (*SumSquareError)(const uint8_t* src_a, const uint8_t* src_b, int count) = SumSquareError_C; #ifdefined(HAS_SUMSQUAREERROR_NEON) if (TestCpuFlag(kCpuHasNEON)) {
SumSquareError = SumSquareError_NEON;
} #endif #ifdefined(HAS_SUMSQUAREERROR_SSE2) if (TestCpuFlag(kCpuHasSSE2)) { // Note only used for multiples of 16 so count is not checked.
SumSquareError = SumSquareError_SSE2;
} #endif #ifdefined(HAS_SUMSQUAREERROR_AVX2) if (TestCpuFlag(kCpuHasAVX2)) { // Note only used for multiples of 32 so count is not checked.
SumSquareError = SumSquareError_AVX2;
} #endif #ifdefined(HAS_SUMSQUAREERROR_MMI) if (TestCpuFlag(kCpuHasMMI)) {
SumSquareError = SumSquareError_MMI;
} #endif #ifdefined(HAS_SUMSQUAREERROR_MSA) if (TestCpuFlag(kCpuHasMSA)) {
SumSquareError = SumSquareError_MSA;
} #endif #ifdef _OPENMP #pragma omp parallel for reduction(+ : sse) #endif for (i = 0; i < (count - (kBlockSize - 1)); i += kBlockSize) {
sse += SumSquareError(src_a + i, src_b + i, kBlockSize);
}
src_a += count & ~(kBlockSize - 1);
src_b += count & ~(kBlockSize - 1); if (remainder) {
sse += SumSquareError(src_a, src_b, remainder);
src_a += remainder;
src_b += remainder;
}
remainder = count & 31; if (remainder) {
sse += SumSquareError_C(src_a, src_b, remainder);
} return sse;
}
LIBYUV_API
uint64_t ComputeSumSquareErrorPlane(const uint8_t* src_a, int stride_a, const uint8_t* src_b, int stride_b, int width, int height) {
uint64_t sse = 0; int h; // Coalesce rows. if (stride_a == width && stride_b == width) {
width *= height;
height = 1;
stride_a = stride_b = 0;
} for (h = 0; h < height; ++h) {
sse += ComputeSumSquareError(src_a, src_b, width);
src_a += stride_a;
src_b += stride_b;
} return sse;
}
// We are using a 8x8 moving window with starting location of each 8x8 window // on the 4x4 pixel grid. Such arrangement allows the windows to overlap // block boundaries to penalize blocking artifacts.
LIBYUV_API double CalcFrameSsim(const uint8_t* src_a, int stride_a, const uint8_t* src_b, int stride_b, int width, int height) { int samples = 0; double ssim_total = 0; double (*Ssim8x8)(const uint8_t* src_a, int stride_a, const uint8_t* src_b, int stride_b) = Ssim8x8_C;
// sample point start with each 4x4 location int i; for (i = 0; i < height - 8; i += 4) { int j; for (j = 0; j < width - 8; j += 4) {
ssim_total += Ssim8x8(src_a + j, stride_a, src_b + j, stride_b);
samples++;
}
Die Informationen auf dieser Webseite wurden
nach bestem Wissen sorgfältig zusammengestellt. Es wird jedoch weder Vollständigkeit, noch Richtigkeit,
noch Qualität der bereit gestellten Informationen zugesichert.
Bemerkung:
Die farbliche Syntaxdarstellung und die Messung sind noch experimentell.