include/libyuv/macros_msa.h - Issue 2285683002: Add MIPS SIMD Arch (MSA) optimized MirrorRow function

Side by Side Diff: include/libyuv/macros_msa.h

Issue 2285683002: Add MIPS SIMD Arch (MSA) optimized MirrorRow function (Closed)

Patch Set: Incorporated review comments Created 4 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

OLD	NEW
(Empty)
	1 /*

	2 * Copyright 2016 The LibYuv Project Authors. All rights reserved.

	3 *

	4 * Use of this source code is governed by a BSD-style license

	5 * that can be found in the LICENSE file in the root of the source

	6 * tree. An additional intellectual property rights grant can be found

	7 * in the file PATENTS. All contributing project authors may

	8 * be found in the AUTHORS file in the root of the source tree.

	9 */

	10

	11 #ifndef __MACROS_MSA_H__

	12 #define __MACROS_MSA_H__

	13

	14 #if !defined(LIBYUV_DISABLE_MSA) && defined(__mips_msa)

	15 #include <stdint.h>

	16 #include <msa.h>

	17

	18 #define LD_B(RTYPE, psrc) *((RTYPE*)(psrc))

	19 #define LD_UB(...) LD_B(v16u8, __VA_ARGS__)

	20

	21 #define ST_B(RTYPE, in, pdst) *((RTYPE*)(pdst)) = (in)

	22 #define ST_UB(...) ST_B(v16u8, __VA_ARGS__)

	23

	24 /* Description : Load two vectors with 16 'byte' sized elements

	25 Arguments : Inputs - psrc, stride

	26 Outputs - out0, out1

	27 Return Type - as per RTYPE

	28 Details : Load 16 byte elements in 'out0' from (psrc)

	29 Load 16 byte elements in 'out1' from (psrc + stride)

	30 */

	31 #define LD_B2(RTYPE, psrc, stride, out0, out1) \

	32 { \

	33 out0 = LD_B(RTYPE, (psrc)); \

	34 out1 = LD_B(RTYPE, (psrc) + stride); \

	35 }

	36 #define LD_UB2(...) LD_B2(v16u8, __VA_ARGS__)

	37 #define LD_SB2(...) LD_B2(v16i8, __VA_ARGS__)

	38

	39 #define LD_B4(RTYPE, psrc, stride, out0, out1, out2, out3) \

	40 { \

	41 LD_B2(RTYPE, (psrc), stride, out0, out1); \

	42 LD_B2(RTYPE, (psrc) + 2 * stride , stride, out2, out3); \

	43 }

	44 #define LD_UB4(...) LD_B4(v16u8, __VA_ARGS__)

	45 #define LD_SB4(...) LD_B4(v16i8, __VA_ARGS__)

	46

	47 /* Description : Store two vectors with stride each having 16 'byte' sized

	48 elements

	49 Arguments : Inputs - in0, in1, pdst, stride

	50 Details : Store 16 byte elements from 'in0' to (pdst)

	51 Store 16 byte elements from 'in1' to (pdst + stride)

	52 */

	53 #define ST_B2(RTYPE, in0, in1, pdst, stride) \

	54 { \

	55 ST_B(RTYPE, in0, (pdst)); \

	56 ST_B(RTYPE, in1, (pdst) + stride); \

	57 }

	58 #define ST_UB2(...) ST_B2(v16u8, __VA_ARGS__)

	59 #define ST_SB2(...) ST_B2(v16i8, __VA_ARGS__)

	60

	61 #define ST_B4(RTYPE, in0, in1, in2, in3, pdst, stride) \

	62 { \

	63 ST_B2(RTYPE, in0, in1, (pdst), stride); \

	64 ST_B2(RTYPE, in2, in3, (pdst) + 2 * stride, stride); \

	65 }

	66 #define ST_UB4(...) ST_B4(v16u8, __VA_ARGS__)

	67 #define ST_SB4(...) ST_B4(v16i8, __VA_ARGS__)

	68

	69 /* Description : Shuffle byte vector elements as per mask vector

	70 Arguments : Inputs - in0, in1, in2, in3, mask0, mask1

	71 Outputs - out0, out1

	72 Return Type - as per RTYPE

	73 Details : Byte elements from 'in0' & 'in1' are copied selectively to

	74 'out0' as per control vector 'mask0'

	75 */

	76 #define VSHF_B2(RTYPE, in0, in1, in2, in3, mask0, mask1, out0, out1) \

	77 { \

	78 out0 = (RTYPE) __msa_vshf_b((v16i8) mask0, (v16i8) in1, (v16i8) in0); \
	fbarchard1 2016/09/17 01:01:30 nit: just a style thing, but I would find the source (row_msa.cc) more readable using the __msa_vshf_b() intrinsic directly.
	manojkumar.bhosale 2016/09/19 08:07:21 On 2016/09/17 01:01:30, fbarchard1 wrote: > nit just a style thing, but I would find the source (row_msa.cc) more readable > using the __msa_vshf_b() intrinsic directly. Done styling.
	79 out1 = (RTYPE) __msa_vshf_b((v16i8) mask1, (v16i8) in3, (v16i8) in2); \

	80 }

	81 #define VSHF_B2_UB(...) VSHF_B2(v16u8, __VA_ARGS__)

	82 #endif /* !defined(LIBYUV_DISABLE_MSA) && defined(__mips_msa) */

	83 #endif /* __MACROS_MSA_H__ */

OLD	NEW

« no previous file with comments | « include/libyuv/cpu_id.h ('k') | include/libyuv/row.h » ('j') | include/libyuv/row.h » ('J')