| OLD | NEW |
| 1 /* | 1 /* |
| 2 * Copyright 2012 The Android Open Source Project | 2 * Copyright 2012 The Android Open Source Project |
| 3 * | 3 * |
| 4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
| 5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
| 6 */ | 6 */ |
| 7 | 7 |
| 8 #include "SkBlitRow_opts_arm_neon.h" | 8 #include "SkBlitRow_opts_arm_neon.h" |
| 9 | 9 |
| 10 #include "SkBlitMask.h" | 10 #include "SkBlitMask.h" |
| 11 #include "SkBlitRow.h" | 11 #include "SkBlitRow.h" |
| 12 #include "SkColorPriv.h" | 12 #include "SkColorPriv.h" |
| 13 #include "SkDither.h" | 13 #include "SkDither.h" |
| 14 #include "SkMathPriv.h" | 14 #include "SkMathPriv.h" |
| 15 #include "SkUtils.h" | 15 #include "SkUtils.h" |
| 16 | 16 |
| 17 #include "SkCachePreload_arm.h" | 17 #include "SkCachePreload_arm.h" |
| 18 #include "SkColor_opts_neon.h" |
| 19 #include <arm_neon.h> |
| 18 | 20 |
| 19 #include <arm_neon.h> | 21 void S32_D565_Opaque_neon(uint16_t* SK_RESTRICT dst, |
| 22 const SkPMColor* SK_RESTRICT src, int count, |
| 23 U8CPU alpha, int /*x*/, int /*y*/) { |
| 24 SkASSERT(255 == alpha); |
| 25 |
| 26 while (count >= 8) { |
| 27 uint8x8x4_t vsrc; |
| 28 uint16x8_t vdst; |
| 29 |
| 30 // Load |
| 31 vsrc = vld4_u8((uint8_t*)src); |
| 32 |
| 33 // Convert src to 565 |
| 34 vdst = vshll_n_u8(vsrc.val[NEON_R], 8); |
| 35 vdst = vsriq_n_u16(vdst, vshll_n_u8(vsrc.val[NEON_G], 8), 5); |
| 36 vdst = vsriq_n_u16(vdst, vshll_n_u8(vsrc.val[NEON_B], 8), 5+6); |
| 37 |
| 38 // Store |
| 39 vst1q_u16(dst, vdst); |
| 40 |
| 41 // Prepare next iteration |
| 42 dst += 8; |
| 43 src += 8; |
| 44 count -= 8; |
| 45 }; |
| 46 |
| 47 // Leftovers |
| 48 while (count > 0) { |
| 49 SkPMColor c = *src++; |
| 50 SkPMColorAssert(c); |
| 51 *dst = SkPixel32ToPixel16_ToU16(c); |
| 52 dst++; |
| 53 count--; |
| 54 }; |
| 55 } |
| 20 | 56 |
| 21 void S32A_D565_Opaque_neon(uint16_t* SK_RESTRICT dst, | 57 void S32A_D565_Opaque_neon(uint16_t* SK_RESTRICT dst, |
| 22 const SkPMColor* SK_RESTRICT src, int count, | 58 const SkPMColor* SK_RESTRICT src, int count, |
| 23 U8CPU alpha, int /*x*/, int /*y*/) { | 59 U8CPU alpha, int /*x*/, int /*y*/) { |
| 24 SkASSERT(255 == alpha); | 60 SkASSERT(255 == alpha); |
| 25 | 61 |
| 26 if (count >= 8) { | 62 if (count >= 8) { |
| 27 uint16_t* SK_RESTRICT keep_dst = 0; | 63 uint16_t* SK_RESTRICT keep_dst = 0; |
| 28 | 64 |
| 29 asm volatile ( | 65 asm volatile ( |
| (...skipping 1293 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 1323 dst += 1; | 1359 dst += 1; |
| 1324 count--; | 1360 count--; |
| 1325 } | 1361 } |
| 1326 } | 1362 } |
| 1327 } | 1363 } |
| 1328 | 1364 |
| 1329 /////////////////////////////////////////////////////////////////////////////// | 1365 /////////////////////////////////////////////////////////////////////////////// |
| 1330 | 1366 |
| 1331 const SkBlitRow::Proc sk_blitrow_platform_565_procs_arm_neon[] = { | 1367 const SkBlitRow::Proc sk_blitrow_platform_565_procs_arm_neon[] = { |
| 1332 // no dither | 1368 // no dither |
| 1333 // NOTE: For the two functions below, we don't have a special version | 1369 // NOTE: For the S32_D565_Blend function below, we don't have a special |
| 1334 // that assumes that each source pixel is opaque. But our S32A is | 1370 // version that assumes that each source pixel is opaque. But our |
| 1335 // still faster than the default, so use it. | 1371 // S32A is still faster than the default, so use it. |
| 1336 S32A_D565_Opaque_neon, // really S32_D565_Opaque | 1372 S32_D565_Opaque_neon, |
| 1337 S32A_D565_Blend_neon, // really S32_D565_Blend | 1373 S32A_D565_Blend_neon, // really S32_D565_Blend |
| 1338 S32A_D565_Opaque_neon, | 1374 S32A_D565_Opaque_neon, |
| 1339 S32A_D565_Blend_neon, | 1375 S32A_D565_Blend_neon, |
| 1340 | 1376 |
| 1341 // dither | 1377 // dither |
| 1342 S32_D565_Opaque_Dither_neon, | 1378 S32_D565_Opaque_Dither_neon, |
| 1343 S32_D565_Blend_Dither_neon, | 1379 S32_D565_Blend_Dither_neon, |
| 1344 S32A_D565_Opaque_Dither_neon, | 1380 S32A_D565_Opaque_Dither_neon, |
| 1345 NULL, // S32A_D565_Blend_Dither | 1381 NULL, // S32A_D565_Blend_Dither |
| 1346 }; | 1382 }; |
| (...skipping 11 matching lines...) Expand all Loading... |
| 1358 * case where we do not inspect the src alpha. | 1394 * case where we do not inspect the src alpha. |
| 1359 */ | 1395 */ |
| 1360 #if SK_A32_SHIFT == 24 | 1396 #if SK_A32_SHIFT == 24 |
| 1361 // This proc assumes the alpha value occupies bits 24-32 of each SkPMColor | 1397 // This proc assumes the alpha value occupies bits 24-32 of each SkPMColor |
| 1362 S32A_Opaque_BlitRow32_neon_src_alpha, // S32A_Opaque, | 1398 S32A_Opaque_BlitRow32_neon_src_alpha, // S32A_Opaque, |
| 1363 #else | 1399 #else |
| 1364 S32A_Opaque_BlitRow32_neon, // S32A_Opaque, | 1400 S32A_Opaque_BlitRow32_neon, // S32A_Opaque, |
| 1365 #endif | 1401 #endif |
| 1366 S32A_Blend_BlitRow32_neon // S32A_Blend | 1402 S32A_Blend_BlitRow32_neon // S32A_Blend |
| 1367 }; | 1403 }; |
| OLD | NEW |