[go: nahoru, domu]

f66ad85
diff -up chromium-48.0.2564.103/third_party/skia/src/opts/SkXfermode_opts.h.gcc6 chromium-48.0.2564.103/third_party/skia/src/opts/SkXfermode_opts.h
f66ad85
--- chromium-48.0.2564.103/third_party/skia/src/opts/SkXfermode_opts.h.gcc6	2016-02-16 15:01:13.200131996 -0500
f66ad85
+++ chromium-48.0.2564.103/third_party/skia/src/opts/SkXfermode_opts.h	2016-02-17 13:31:50.216198258 -0500
f66ad85
@@ -109,76 +109,71 @@ XFERMODE(Lighten) {
f66ad85
 }
f66ad85
 #undef XFERMODE
f66ad85
 
f66ad85
-// Some xfermodes use math like divide or sqrt that's best done in floats.
f66ad85
-// We write it generically, then call it 1 or 2 pixels at a time (T == Sk4f or Sk8f).
f66ad85
-#define XFERMODE(Name) struct Name { template <typename T> T operator()(const T&, const T&); }; \
f66ad85
-    template <typename T> T Name::operator()(const T& d, const T& s)
f66ad85
+// Some xfermodes use math like divide or sqrt that's best done in floats 1 pixel at a time.
f66ad85
+#define XFERMODE(Name) static Sk4f SK_VECTORCALL Name(Sk4f d, Sk4f s)
f66ad85
 
f66ad85
-static_assert(SK_A32_SHIFT == 24, "");
f66ad85
 static inline Sk4f a_rgb(const Sk4f& a, const Sk4f& rgb) {
f66ad85
+    static_assert(SK_A32_SHIFT == 24, "");
f66ad85
     return a * Sk4f(0,0,0,1) + rgb * Sk4f(1,1,1,0);
f66ad85
 }
f66ad85
-static inline Sk8f a_rgb(const Sk8f& a, const Sk8f& rgb) {
f66ad85
-    // TODO: SkNx_blend<0,0,0,1,0,0,0,1>(a, rgb) to let us use _mm256_blend_ps?
f66ad85
-    return a * Sk8f(0,0,0,1,0,0,0,1) + rgb * Sk8f(1,1,1,0,1,1,1,0);
f66ad85
+static inline Sk4f alphas(const Sk4f& f) {
f66ad85
+    return SkNx_dup<SK_A32_SHIFT/8>(f);
f66ad85
 }
f66ad85
-static inline Sk4f alphas(const Sk4f& f) { return SkNx_shuffle<3,3,3,3>        (f); }
f66ad85
-static inline Sk8f alphas(const Sk8f& f) { return SkNx_shuffle<3,3,3,3,7,7,7,7>(f); }
f66ad85
 
f66ad85
 XFERMODE(ColorDodge) {
f66ad85
     auto sa = alphas(s),
f66ad85
          da = alphas(d),
f66ad85
-         isa = T(1)-sa,
f66ad85
-         ida = T(1)-da;
f66ad85
+         isa = Sk4f(1)-sa,
f66ad85
+         ida = Sk4f(1)-da;
f66ad85
 
f66ad85
     auto srcover = s + d*isa,
f66ad85
          dstover = d + s*ida,
f66ad85
-         otherwise = sa * T::Min(da, (d*sa)*(sa-s).approxInvert()) + s*ida + d*isa;
f66ad85
+         otherwise = sa * Sk4f::Min(da, (d*sa)*(sa-s).approxInvert()) + s*ida + d*isa;
f66ad85
 
f66ad85
     // Order matters here, preferring d==0 over s==sa.
f66ad85
-    auto colors = (d ==  0).thenElse(dstover,
f66ad85
-                  (s == sa).thenElse(srcover,
f66ad85
-                                     otherwise));
f66ad85
+    auto colors = (d == Sk4f(0)).thenElse(dstover,
f66ad85
+                  (s ==      sa).thenElse(srcover,
f66ad85
+                                          otherwise));
f66ad85
     return a_rgb(srcover, colors);
f66ad85
 }
f66ad85
 XFERMODE(ColorBurn) {
f66ad85
     auto sa = alphas(s),
f66ad85
          da = alphas(d),
f66ad85
-         isa = T(1)-sa,
f66ad85
-         ida = T(1)-da;
f66ad85
+         isa = Sk4f(1)-sa,
f66ad85
+         ida = Sk4f(1)-da;
f66ad85
 
f66ad85
     auto srcover = s + d*isa,
f66ad85
          dstover = d + s*ida,
f66ad85
-         otherwise = sa*(da-T::Min(da, (da-d)*sa*s.approxInvert())) + s*ida + d*isa;
f66ad85
+         otherwise = sa*(da-Sk4f::Min(da, (da-d)*sa*s.approxInvert())) + s*ida + d*isa;
f66ad85
 
f66ad85
     // Order matters here, preferring d==da over s==0.
f66ad85
-    auto colors = (d == da).thenElse(dstover,
f66ad85
-                  (s ==  0).thenElse(srcover,
f66ad85
-                                     otherwise));
f66ad85
+    auto colors = (d ==      da).thenElse(dstover,
f66ad85
+                  (s == Sk4f(0)).thenElse(srcover,
f66ad85
+                                          otherwise));
f66ad85
     return a_rgb(srcover, colors);
f66ad85
 }
f66ad85
 XFERMODE(SoftLight) {
f66ad85
     auto sa = alphas(s),
f66ad85
          da = alphas(d),
f66ad85
-         isa = T(1)-sa,
f66ad85
-         ida = T(1)-da;
f66ad85
+         isa = Sk4f(1)-sa,
f66ad85
+         ida = Sk4f(1)-da;
f66ad85
 
f66ad85
     // Some common terms.
f66ad85
-    auto m  = (da > 0).thenElse(d / da, 0),
f66ad85
-         s2 = s*2,
f66ad85
-         m4 = m*4;
f66ad85
+    auto m  = (da > Sk4f(0)).thenElse(d / da, Sk4f(0)),
f66ad85
+         s2 = Sk4f(2)*s,
f66ad85
+         m4 = Sk4f(4)*m;
f66ad85
 
f66ad85
     // The logic forks three ways:
f66ad85
     //    1. dark src?
f66ad85
     //    2. light src, dark dst?
f66ad85
     //    3. light src, light dst?
f66ad85
-    auto darkSrc = d*(sa + (s2 - sa)*(T(1) - m)),  // Used in case 1.
f66ad85
-         darkDst = (m4*m4 + m4)*(m - 1) + m*7,     // Used in case 2.
f66ad85
-         liteDst = m.sqrt() - m,                   // Used in case 3.
f66ad85
-         liteSrc = d*sa + da*(s2-sa)*(d*4 <= da).thenElse(darkDst, liteDst); // Case 2 or 3?
f66ad85
+    auto darkSrc = d*(sa + (s2 - sa)*(Sk4f(1) - m)),        // Used in case 1.
f66ad85
+         darkDst = (m4*m4 + m4)*(m - Sk4f(1)) + Sk4f(7)*m,  // Used in case 2.
f66ad85
+         liteDst = m.sqrt() - m,                            // Used in case 3.
f66ad85
+         liteSrc = d*sa + da*(s2-sa)*(Sk4f(4)*d <= da).thenElse(darkDst, liteDst); // Case 2 or 3?
f66ad85
 
f66ad85
     auto alpha  = s + d*isa;
f66ad85
-    auto colors = s*ida + d*isa + (s2 <= sa).thenElse(darkSrc, liteSrc);     // Case 1 or 2/3?
f66ad85
+    auto colors = s*ida + d*isa + (s2 <= sa).thenElse(darkSrc, liteSrc);           // Case 1 or 2/3?
f66ad85
 
f66ad85
     return a_rgb(alpha, colors);
f66ad85
 }
f66ad85
@@ -245,52 +240,53 @@ private:
f66ad85
     typedef SkProcCoeffXfermode INHERITED;
f66ad85
 };
f66ad85
 
f66ad85
-template <typename BlendFn>
f66ad85
-class FloatXfermode : public SkProcCoeffXfermode {
f66ad85
+class Sk4fXfermode : public SkProcCoeffXfermode {
f66ad85
 public:
f66ad85
-    FloatXfermode(const ProcCoeff& rec, SkXfermode::Mode mode)
f66ad85
-        : INHERITED(rec, mode) {}
f66ad85
+    typedef Sk4f (SK_VECTORCALL *ProcF)(Sk4f, Sk4f);
f66ad85
+    Sk4fXfermode(const ProcCoeff& rec, SkXfermode::Mode mode, ProcF procf)
f66ad85
+        : INHERITED(rec, mode)
f66ad85
+        , fProcF(procf) {}
f66ad85
 
f66ad85
     void xfer32(SkPMColor dst[], const SkPMColor src[], int n, const SkAlpha aa[]) const override {
f66ad85
-        BlendFn blend;
f66ad85
-        while (n >= 2) {
f66ad85
-            auto d = Sk8f::FromBytes((const uint8_t*)dst) * (1.0f/255),
f66ad85
-                 s = Sk8f::FromBytes((const uint8_t*)src) * (1.0f/255),
f66ad85
-                 b = blend(d, s);
f66ad85
-            if (aa) {
f66ad85
-                auto a255 = Sk8f(aa[0],aa[0],aa[0],aa[0], aa[1],aa[1],aa[1],aa[1]);
f66ad85
-                (b*a255 + d*(Sk8f(255)-a255) + 0.5).toBytes((uint8_t*)dst);
f66ad85
-                aa += 2;
f66ad85
-            } else {
f66ad85
-                (b * 255 + 0.5).toBytes((uint8_t*)dst);
f66ad85
-            }
f66ad85
-            dst += 2;
f66ad85
-            src += 2;
f66ad85
-            n   -= 2;
f66ad85
-        }
f66ad85
-        if (n) {
f66ad85
-            auto d = Sk4f::FromBytes((const uint8_t*)dst) * (1.0f/255),
f66ad85
-                 s = Sk4f::FromBytes((const uint8_t*)src) * (1.0f/255),
f66ad85
-                 b = blend(d, s);
f66ad85
-            if (aa) {
f66ad85
-                auto a255 = Sk4f(aa[0],aa[0],aa[0],aa[0]);
f66ad85
-                (b*a255 + d*(Sk4f(255)-a255) + 0.5).toBytes((uint8_t*)dst);
f66ad85
-                aa++;
f66ad85
-            } else {
f66ad85
-                (b * 255 + 0.5).toBytes((uint8_t*)dst);
f66ad85
-            }
f66ad85
+        for (int i = 0; i < n; i++) {
f66ad85
+            dst[i] = aa ? this->xfer32(dst[i], src[i], aa[i])
f66ad85
+                        : this->xfer32(dst[i], src[i]);
f66ad85
         }
f66ad85
     }
f66ad85
 
f66ad85
     void xfer16(uint16_t dst[], const SkPMColor src[], int n, const SkAlpha aa[]) const override {
f66ad85
         for (int i = 0; i < n; i++) {
f66ad85
-            SkPMColor dst32 = SkPixel16ToPixel32(dst[i]);           // Convert dst up to 8888.
f66ad85
-            this->xfer32(&dst32, src+i, 1, aa ? aa+i : nullptr);    // Blend 1 pixel.
f66ad85
-            dst[i] = SkPixel32ToPixel16(dst32);                     // Repack dst to 565 and store.
f66ad85
+            SkPMColor dst32 = SkPixel16ToPixel32(dst[i]);
f66ad85
+            dst32 = aa ? this->xfer32(dst32, src[i], aa[i])
f66ad85
+                       : this->xfer32(dst32, src[i]);
f66ad85
+            dst[i] = SkPixel32ToPixel16(dst32);
f66ad85
         }
f66ad85
     }
f66ad85
 
f66ad85
 private:
f66ad85
+    static Sk4f Load(SkPMColor c) {
f66ad85
+        return Sk4f::FromBytes((uint8_t*)&c) * Sk4f(1.0f/255);
f66ad85
+    }
f66ad85
+    static SkPMColor Round(const Sk4f& f) {
f66ad85
+        SkPMColor c;
f66ad85
+        (f * Sk4f(255) + Sk4f(0.5f)).toBytes((uint8_t*)&c);
f66ad85
+        return c;
f66ad85
+    }
f66ad85
+    inline SkPMColor xfer32(SkPMColor dst, SkPMColor src) const {
f66ad85
+        return Round(fProcF(Load(dst), Load(src)));
f66ad85
+    }
f66ad85
+
f66ad85
+    inline SkPMColor xfer32(SkPMColor dst, SkPMColor src, SkAlpha aa) const {
f66ad85
+        Sk4f s(Load(src)),
f66ad85
+             d(Load(dst)),
f66ad85
+             b(fProcF(d,s));
f66ad85
+        // We do aa in full float precision before going back down to bytes, because we can!
f66ad85
+        Sk4f a = Sk4f(aa) * Sk4f(1.0f/255);
f66ad85
+        b = b*a + d*(Sk4f(1)-a);
f66ad85
+        return Round(b);
f66ad85
+    }
f66ad85
+
f66ad85
+    ProcF fProcF;
f66ad85
     typedef SkProcCoeffXfermode INHERITED;
f66ad85
 };
f66ad85
 
f66ad85
@@ -327,7 +323,7 @@ static SkXfermode* create_xfermode(const
f66ad85
     #undef CASE
f66ad85
 
f66ad85
 #define CASE(Mode) \
f66ad85
-    case SkXfermode::k##Mode##_Mode: return new FloatXfermode<Mode>(rec, mode)
f66ad85
+    case SkXfermode::k##Mode##_Mode: return new Sk4fXfermode(rec, mode, &Mode)
f66ad85
         CASE(ColorDodge);
f66ad85
         CASE(ColorBurn);
f66ad85
         CASE(SoftLight);