| Index: src/opts/SkNx_sse.h
 | 
| diff --git a/src/opts/SkNx_sse.h b/src/opts/SkNx_sse.h
 | 
| index 3e66637df3d551fdd681179527dc4d1c293aaee7..25a5cd8f84232027c0a011004a962e346ac63e6f 100644
 | 
| --- a/src/opts/SkNx_sse.h
 | 
| +++ b/src/opts/SkNx_sse.h
 | 
| @@ -478,4 +478,29 @@ static inline void Sk4h_store4(void* dst, const Sk4h& r, const Sk4h& g, const Sk
 | 
|      _mm_storeu_si128(((__m128i*) dst) + 1, hi);
 | 
|  }
 | 
|  
 | 
| +static inline void Sk4f_load4(const void* ptr, Sk4f* r, Sk4f* g, Sk4f* b, Sk4f* a) {
 | 
| +    __m128 v0 = _mm_loadu_ps(((float*)ptr) +  0),
 | 
| +           v1 = _mm_loadu_ps(((float*)ptr) +  4),
 | 
| +           v2 = _mm_loadu_ps(((float*)ptr) +  8),
 | 
| +           v3 = _mm_loadu_ps(((float*)ptr) + 12);
 | 
| +    _MM_TRANSPOSE4_PS(v0, v1, v2, v3);
 | 
| +    *r = v0;
 | 
| +    *g = v1;
 | 
| +    *b = v2;
 | 
| +    *a = v3;
 | 
| +}
 | 
| +
 | 
| +static inline void Sk4f_store4(void* dst, const Sk4f& r, const Sk4f& g, const Sk4f& b,
 | 
| +                               const Sk4f& a) {
 | 
| +    __m128 v0 = r.fVec,
 | 
| +           v1 = g.fVec,
 | 
| +           v2 = b.fVec,
 | 
| +           v3 = a.fVec;
 | 
| +    _MM_TRANSPOSE4_PS(v0, v1, v2, v3);
 | 
| +    _mm_storeu_ps(((float*) dst) +  0, v0);
 | 
| +    _mm_storeu_ps(((float*) dst) +  4, v1);
 | 
| +    _mm_storeu_ps(((float*) dst) +  8, v2);
 | 
| +    _mm_storeu_ps(((float*) dst) + 12, v3);
 | 
| +}
 | 
| +
 | 
|  #endif//SkNx_sse_DEFINED
 | 
| 
 |