/* * Copyright 2018 Google Inc. * * Use of this source code is governed by a BSD-style license that can be * found in the LICENSE file. */ #include "src/gpu/ganesh/ops/FillRRectOp.h" #include "include/core/SkClipOp.h" #include "include/core/SkMatrix.h" #include "include/core/SkRRect.h" #include "include/core/SkRect.h" #include "include/core/SkRefCnt.h" #include "include/core/SkScalar.h" #include "include/core/SkString.h" #include "include/gpu/ganesh/GrRecordingContext.h" #include "include/private/SkColorData.h" #include "include/private/base/SkAlignedStorage.h" #include "include/private/base/SkAssert.h" #include "include/private/base/SkDebug.h" #include "include/private/base/SkMacros.h" #include "include/private/base/SkOnce.h" #include "include/private/base/SkPoint_impl.h" #include "include/private/base/SkTArray.h" #include "include/private/gpu/ganesh/GrTypesPriv.h" #include "src/base/SkArenaAlloc.h" #include "src/base/SkUtils.h" #include "src/base/SkVx.h" #include "src/core/SkRRectPriv.h" #include "src/core/SkSLTypeShared.h" #include "src/gpu/BufferWriter.h" #include "src/gpu/KeyBuilder.h" #include "src/gpu/ResourceKey.h" #include "src/gpu/ganesh/GrAppliedClip.h" #include "src/gpu/ganesh/GrBuffer.h" #include "src/gpu/ganesh/GrCaps.h" #include "src/gpu/ganesh/GrGeometryProcessor.h" #include "src/gpu/ganesh/GrMeshDrawTarget.h" #include "src/gpu/ganesh/GrOpFlushState.h" #include "src/gpu/ganesh/GrPaint.h" #include "src/gpu/ganesh/GrProcessorAnalysis.h" #include "src/gpu/ganesh/GrProcessorSet.h" #include "src/gpu/ganesh/GrProgramInfo.h" #include "src/gpu/ganesh/GrRecordingContextPriv.h" #include "src/gpu/ganesh/GrResourceProvider.h" #include "src/gpu/ganesh/GrShaderCaps.h" #include "src/gpu/ganesh/GrShaderVar.h" #include "src/gpu/ganesh/geometry/GrShape.h" #include "src/gpu/ganesh/glsl/GrGLSLFragmentShaderBuilder.h" #include "src/gpu/ganesh/glsl/GrGLSLVarying.h" #include "src/gpu/ganesh/glsl/GrGLSLVertexGeoBuilder.h" #include "src/gpu/ganesh/ops/GrDrawOp.h" #include "src/gpu/ganesh/ops/GrMeshDrawOp.h" #include "src/gpu/ganesh/ops/GrSimpleMeshDrawOpHelper.h" #if defined(GPU_TEST_UTILS) #include "src/base/SkRandom.h" #include "src/gpu/ganesh/GrDrawOpTest.h" #include "src/gpu/ganesh/GrTestUtils.h" #endif #include #include #include #include #include #include class GrDstProxyView; class GrGLSLProgramDataManager; class GrSurfaceProxyView; enum class GrXferBarrierFlags; namespace skgpu::ganesh { class SurfaceDrawContext; } using namespace skia_private; namespace skgpu::ganesh::FillRRectOp { namespace { // Note: Just checking m.restStaysRect is not sufficient bool skews_are_relevant(const SkMatrix& m) { SkASSERT(!m.hasPerspective()); if (m[SkMatrix::kMSkewX] == 0.0f && m[SkMatrix::kMSkewY] == 0.0f) { return false; } static constexpr float kTol = SK_ScalarNearlyZero; float absScaleX = SkScalarAbs(m[SkMatrix::kMScaleX]); float absSkewX = SkScalarAbs(m[SkMatrix::kMSkewX]); float absScaleY = SkScalarAbs(m[SkMatrix::kMScaleY]); float absSkewY = SkScalarAbs(m[SkMatrix::kMSkewY]); // The maximum absolute column sum norm of the upper left 2x2 float norm = std::max(absScaleX + absSkewY, absSkewX + absScaleY); return absSkewX > kTol * norm || absSkewY > kTol * norm; } class FillRRectOpImpl final : public GrMeshDrawOp { private: using Helper = GrSimpleMeshDrawOpHelper; public: DEFINE_OP_CLASS_ID struct LocalCoords { enum class Type : bool { kRect, kMatrix }; LocalCoords(const SkRect& localRect) : fType(Type::kRect) , fRect(localRect) {} LocalCoords(const SkMatrix& localMatrix) : fType(Type::kMatrix) , fMatrix(localMatrix) {} Type fType; union { SkRect fRect; SkMatrix fMatrix; }; }; static GrOp::Owner Make(GrRecordingContext*, SkArenaAlloc*, GrPaint&&, const SkMatrix& viewMatrix, const SkRRect&, const LocalCoords&, GrAA); const char* name() const override { return "FillRRectOp"; } FixedFunctionFlags fixedFunctionFlags() const override { return fHelper.fixedFunctionFlags(); } ClipResult clipToShape(skgpu::ganesh::SurfaceDrawContext*, SkClipOp, const SkMatrix& clipMatrix, const GrShape&, GrAA) override; GrProcessorSet::Analysis finalize(const GrCaps&, const GrAppliedClip*, GrClampType) override; CombineResult onCombineIfPossible(GrOp*, SkArenaAlloc*, const GrCaps&) override; #if defined(GPU_TEST_UTILS) SkString onDumpInfo() const override; #endif void visitProxies(const GrVisitProxyFunc& func) const override { if (fProgramInfo) { fProgramInfo->visitFPProxies(func); } else { fHelper.visitProxies(func); } } void onPrepareDraws(GrMeshDrawTarget*) override; void onExecute(GrOpFlushState*, const SkRect& chainBounds) override; private: friend class ::GrSimpleMeshDrawOpHelper; // for access to ctor friend class ::GrOp; // for access to ctor enum class ProcessorFlags { kNone = 0, kUseHWDerivatives = 1 << 0, kHasLocalCoords = 1 << 1, kWideColor = 1 << 2, kMSAAEnabled = 1 << 3, kFakeNonAA = 1 << 4, }; constexpr static int kNumProcessorFlags = 5; SK_DECL_BITFIELD_CLASS_OPS_FRIENDS(ProcessorFlags); class Processor; FillRRectOpImpl(GrProcessorSet*, const SkPMColor4f& paintColor, SkArenaAlloc*, const SkMatrix& viewMatrix, const SkRRect&, const LocalCoords&, ProcessorFlags); GrProgramInfo* programInfo() override { return fProgramInfo; } // Create a GrProgramInfo object in the provided arena void onCreateProgramInfo(const GrCaps*, SkArenaAlloc*, const GrSurfaceProxyView& writeView, bool usesMSAASurface, GrAppliedClip&&, const GrDstProxyView&, GrXferBarrierFlags renderPassXferBarriers, GrLoadOp colorLoadOp) override; Helper fHelper; ProcessorFlags fProcessorFlags; struct Instance { Instance(const SkMatrix& viewMatrix, const SkRRect& rrect, const LocalCoords& localCoords, const SkPMColor4f& color) : fViewMatrix(viewMatrix), fRRect(rrect), fLocalCoords(localCoords), fColor(color) { } SkMatrix fViewMatrix; SkRRect fRRect; LocalCoords fLocalCoords; SkPMColor4f fColor; Instance* fNext = nullptr; }; Instance* fHeadInstance; Instance** fTailInstance; int fInstanceCount = 1; sk_sp fInstanceBuffer; sk_sp fVertexBuffer; sk_sp fIndexBuffer; int fBaseInstance = 0; // If this op is prePrepared the created programInfo will be stored here for use in // onExecute. In the prePrepared case it will have been stored in the record-time arena. GrProgramInfo* fProgramInfo = nullptr; }; SK_MAKE_BITFIELD_CLASS_OPS(FillRRectOpImpl::ProcessorFlags) // Hardware derivatives are not always accurate enough for highly elliptical corners. This method // checks to make sure the corners will still all look good if we use HW derivatives. bool can_use_hw_derivatives_with_coverage(const GrShaderCaps&, const SkMatrix&, const SkRRect&); GrOp::Owner FillRRectOpImpl::Make(GrRecordingContext* ctx, SkArenaAlloc* arena, GrPaint&& paint, const SkMatrix& viewMatrix, const SkRRect& rrect, const LocalCoords& localCoords, GrAA aa) { const GrCaps* caps = ctx->priv().caps(); if (!caps->drawInstancedSupport()) { return nullptr; } // We transform into a normalized -1..+1 space to draw the round rect. If the boundaries are too // large, the math can overflow. The caller can fall back on path rendering if this is the case. if (std::max(rrect.height(), rrect.width()) >= 1e6f) { return nullptr; } ProcessorFlags flags = ProcessorFlags::kNone; // TODO: Support perspective in a follow-on CL. This shouldn't be difficult, since we already // use HW derivatives. The only trick will be adjusting the AA outset to account for // perspective. (i.e., outset = 0.5 * z.) if (viewMatrix.hasPerspective()) { return nullptr; } if (can_use_hw_derivatives_with_coverage(*caps->shaderCaps(), viewMatrix, rrect)) { // HW derivatives (more specifically, fwidth()) are consistently faster on all platforms in // coverage mode. We use them as long as the approximation will be accurate enough. flags |= ProcessorFlags::kUseHWDerivatives; } if (aa == GrAA::kNo) { flags |= ProcessorFlags::kFakeNonAA; } return Helper::FactoryHelper(ctx, std::move(paint), arena, viewMatrix, rrect, localCoords, flags); } FillRRectOpImpl::FillRRectOpImpl(GrProcessorSet* processorSet, const SkPMColor4f& paintColor, SkArenaAlloc* arena, const SkMatrix& viewMatrix, const SkRRect& rrect, const LocalCoords& localCoords, ProcessorFlags processorFlags) : GrMeshDrawOp(ClassID()) , fHelper(processorSet, (processorFlags & ProcessorFlags::kFakeNonAA) ? GrAAType::kNone : GrAAType::kCoverage) // Use analytic AA even if the RT is MSAA. , fProcessorFlags(processorFlags & ~(ProcessorFlags::kHasLocalCoords | ProcessorFlags::kWideColor | ProcessorFlags::kMSAAEnabled)) , fHeadInstance(arena->make(viewMatrix, rrect, localCoords, paintColor)) , fTailInstance(&fHeadInstance->fNext) { // FillRRectOp::Make fails if there is perspective. SkASSERT(!viewMatrix.hasPerspective()); this->setBounds(viewMatrix.mapRect(rrect.getBounds()), GrOp::HasAABloat(!(processorFlags & ProcessorFlags::kFakeNonAA)), GrOp::IsHairline::kNo); } GrDrawOp::ClipResult FillRRectOpImpl::clipToShape(skgpu::ganesh::SurfaceDrawContext* sdc, SkClipOp clipOp, const SkMatrix& clipMatrix, const GrShape& shape, GrAA aa) { SkASSERT(fInstanceCount == 1); // This needs to be called before combining. SkASSERT(fHeadInstance->fNext == nullptr); if ((shape.isRect() || shape.isRRect()) && clipOp == SkClipOp::kIntersect && (aa == GrAA::kNo) == (fProcessorFlags & ProcessorFlags::kFakeNonAA)) { // The clip shape is a round rect. Attempt to map it to a round rect in "viewMatrix" space. SkRRect clipRRect; if (clipMatrix == fHeadInstance->fViewMatrix) { if (shape.isRect()) { clipRRect.setRect(shape.rect()); } else { clipRRect = shape.rrect(); } } else { // Find a matrix that maps from "clipMatrix" space to "viewMatrix" space. SkASSERT(!fHeadInstance->fViewMatrix.hasPerspective()); if (clipMatrix.hasPerspective()) { return ClipResult::kFail; } SkMatrix clipToView; if (!fHeadInstance->fViewMatrix.invert(&clipToView)) { return ClipResult::kClippedOut; } clipToView.preConcat(clipMatrix); SkASSERT(!clipToView.hasPerspective()); if (skews_are_relevant(clipToView)) { // A rect in "clipMatrix" space is not a rect in "viewMatrix" space. return ClipResult::kFail; } clipToView.setSkewX(0); clipToView.setSkewY(0); SkASSERT(clipToView.rectStaysRect()); if (shape.isRect()) { clipRRect.setRect(clipToView.mapRect(shape.rect())); } else { if (!shape.rrect().transform(clipToView, &clipRRect)) { // Transforming the rrect failed. This shouldn't generally happen except in // cases of fp32 overflow. return ClipResult::kFail; } } } // Intersect our round rect with the clip shape. SkRRect isectRRect; if (fHeadInstance->fRRect.isRect() && clipRRect.isRect()) { SkRect isectRect; if (!isectRect.intersect(fHeadInstance->fRRect.rect(), clipRRect.rect())) { return ClipResult::kClippedOut; } isectRRect.setRect(isectRect); } else { isectRRect = SkRRectPriv::ConservativeIntersect(fHeadInstance->fRRect, clipRRect); if (isectRRect.isEmpty()) { // The round rects did not intersect at all or the intersection was too complicated // to compute quickly. return ClipResult::kFail; } } // Don't apply the clip geometrically if it becomes subpixel, since then the hairline // rendering may outset beyond the original clip. SkRect devISectBounds = fHeadInstance->fViewMatrix.mapRect(isectRRect.rect()); if (devISectBounds.width() < 1.f || devISectBounds.height() < 1.f) { return ClipResult::kFail; } if (fHeadInstance->fLocalCoords.fType == LocalCoords::Type::kRect) { // Update the local rect. auto rect = sk_bit_cast(fHeadInstance->fRRect.rect()); auto local = sk_bit_cast(fHeadInstance->fLocalCoords.fRect); auto isect = sk_bit_cast(isectRRect.rect()); auto rectToLocalSize = (local - skvx::shuffle<2,3,0,1>(local)) / (rect - skvx::shuffle<2,3,0,1>(rect)); auto localCoordsRect = (isect - rect) * rectToLocalSize + local; fHeadInstance->fLocalCoords.fRect.setLTRB(localCoordsRect.x(), localCoordsRect.y(), localCoordsRect.z(), localCoordsRect.w()); } // Update the round rect. fHeadInstance->fRRect = isectRRect; return ClipResult::kClippedGeometrically; } return ClipResult::kFail; } GrProcessorSet::Analysis FillRRectOpImpl::finalize(const GrCaps& caps, const GrAppliedClip* clip, GrClampType clampType) { SkASSERT(fInstanceCount == 1); SkASSERT(fHeadInstance->fNext == nullptr); bool isWideColor; auto analysis = fHelper.finalizeProcessors(caps, clip, clampType, GrProcessorAnalysisCoverage::kSingleChannel, &fHeadInstance->fColor, &isWideColor); if (isWideColor) { fProcessorFlags |= ProcessorFlags::kWideColor; } if (analysis.usesLocalCoords()) { fProcessorFlags |= ProcessorFlags::kHasLocalCoords; } return analysis; } GrOp::CombineResult FillRRectOpImpl::onCombineIfPossible(GrOp* op, SkArenaAlloc*, const GrCaps& caps) { auto that = op->cast(); if (!fHelper.isCompatible(that->fHelper, caps, this->bounds(), that->bounds()) || fProcessorFlags != that->fProcessorFlags) { return CombineResult::kCannotCombine; } *fTailInstance = that->fHeadInstance; fTailInstance = that->fTailInstance; fInstanceCount += that->fInstanceCount; return CombineResult::kMerged; } #if defined(GPU_TEST_UTILS) SkString FillRRectOpImpl::onDumpInfo() const { SkString str = SkStringPrintf("# instances: %d\n", fInstanceCount); str += fHelper.dumpInfo(); int i = 0; for (Instance* tmp = fHeadInstance; tmp; tmp = tmp->fNext, ++i) { str.appendf("%d: Color: [%.2f, %.2f, %.2f, %.2f] ", i, tmp->fColor.fR, tmp->fColor.fG, tmp->fColor.fB, tmp->fColor.fA); SkMatrix m = tmp->fViewMatrix; str.appendf("ViewMatrix: [%.2f, %.2f, %.2f, %.2f, %.2f, %.2f, %.2f, %.2f, %.2f] ", m[0], m[1], m[2], m[3], m[4], m[5], m[6], m[7], m[8]); SkRect r = tmp->fRRect.rect(); str.appendf("Rect: [%f %f %f %f]\n", r.fLeft, r.fTop, r.fRight, r.fBottom); } return str; } #endif class FillRRectOpImpl::Processor final : public GrGeometryProcessor { public: static GrGeometryProcessor* Make(SkArenaAlloc* arena, GrAAType aaType, ProcessorFlags flags) { return arena->make([&](void* ptr) { return new (ptr) Processor(aaType, flags); }); } const char* name() const override { return "FillRRectOp::Processor"; } void addToKey(const GrShaderCaps& caps, KeyBuilder* b) const override { b->addBits(kNumProcessorFlags, (uint32_t)fFlags, "flags"); } std::unique_ptr makeProgramImpl(const GrShaderCaps&) const override; private: class Impl; Processor(GrAAType aaType, ProcessorFlags flags) : GrGeometryProcessor(kGrFillRRectOp_Processor_ClassID) , fFlags(flags) { this->setVertexAttributesWithImplicitOffsets(kVertexAttribs, std::size(kVertexAttribs)); fInstanceAttribs.emplace_back("radii_x", kFloat4_GrVertexAttribType, SkSLType::kFloat4); fInstanceAttribs.emplace_back("radii_y", kFloat4_GrVertexAttribType, SkSLType::kFloat4); fInstanceAttribs.emplace_back("skew", kFloat4_GrVertexAttribType, SkSLType::kFloat4); if (fFlags & ProcessorFlags::kHasLocalCoords) { fInstanceAttribs.emplace_back("translate_and_localrotate", kFloat4_GrVertexAttribType, SkSLType::kFloat4); fInstanceAttribs.emplace_back( "localrect", kFloat4_GrVertexAttribType, SkSLType::kFloat4); } else { fInstanceAttribs.emplace_back("translate_and_localrotate", kFloat2_GrVertexAttribType, SkSLType::kFloat2); } fColorAttrib = &fInstanceAttribs.push_back( MakeColorAttribute("color", (fFlags & ProcessorFlags::kWideColor))); SkASSERT(fInstanceAttribs.size() <= kMaxInstanceAttribs); this->setInstanceAttributesWithImplicitOffsets(fInstanceAttribs.begin(), fInstanceAttribs.size()); } inline static constexpr Attribute kVertexAttribs[] = { {"radii_selector", kFloat4_GrVertexAttribType, SkSLType::kFloat4}, {"corner_and_radius_outsets", kFloat4_GrVertexAttribType, SkSLType::kFloat4}, // Coverage only. {"aa_bloat_and_coverage", kFloat4_GrVertexAttribType, SkSLType::kFloat4}}; const ProcessorFlags fFlags; constexpr static int kMaxInstanceAttribs = 6; STArray fInstanceAttribs; const Attribute* fColorAttrib; }; // Our coverage geometry consists of an inset octagon with solid coverage, surrounded by linear // coverage ramps on the horizontal and vertical edges, and "arc coverage" pieces on the diagonal // edges. The Vertex struct tells the shader where to place its vertex within a normalized // ([l, t, r, b] = [-1, -1, +1, +1]) space, and how to calculate coverage. See onEmitCode. struct CoverageVertex { std::array fRadiiSelector; std::array fCorner; std::array fRadiusOutset; std::array fAABloatDirection; float fCoverage; float fIsLinearCoverage; }; // This is the offset (when multiplied by radii) from the corners of a bounding box to the vertices // of its inscribed octagon. We draw the outside portion of arcs with quarter-octagons rather than // rectangles. static constexpr float kOctoOffset = 1/(1 + SK_ScalarRoot2Over2); static constexpr CoverageVertex kVertexData[] = { // Left inset edge. {{{0,0,0,1}}, {{-1,+1}}, {{0,-1}}, {{+1,0}}, 1, 1}, {{{1,0,0,0}}, {{-1,-1}}, {{0,+1}}, {{+1,0}}, 1, 1}, // Top inset edge. {{{1,0,0,0}}, {{-1,-1}}, {{+1,0}}, {{0,+1}}, 1, 1}, {{{0,1,0,0}}, {{+1,-1}}, {{-1,0}}, {{0,+1}}, 1, 1}, // Right inset edge. {{{0,1,0,0}}, {{+1,-1}}, {{0,+1}}, {{-1,0}}, 1, 1}, {{{0,0,1,0}}, {{+1,+1}}, {{0,-1}}, {{-1,0}}, 1, 1}, // Bottom inset edge. {{{0,0,1,0}}, {{+1,+1}}, {{-1,0}}, {{0,-1}}, 1, 1}, {{{0,0,0,1}}, {{-1,+1}}, {{+1,0}}, {{0,-1}}, 1, 1}, // Left outset edge. {{{0,0,0,1}}, {{-1,+1}}, {{0,-1}}, {{-1,0}}, 0, 1}, {{{1,0,0,0}}, {{-1,-1}}, {{0,+1}}, {{-1,0}}, 0, 1}, // Top outset edge. {{{1,0,0,0}}, {{-1,-1}}, {{+1,0}}, {{0,-1}}, 0, 1}, {{{0,1,0,0}}, {{+1,-1}}, {{-1,0}}, {{0,-1}}, 0, 1}, // Right outset edge. {{{0,1,0,0}}, {{+1,-1}}, {{0,+1}}, {{+1,0}}, 0, 1}, {{{0,0,1,0}}, {{+1,+1}}, {{0,-1}}, {{+1,0}}, 0, 1}, // Bottom outset edge. {{{0,0,1,0}}, {{+1,+1}}, {{-1,0}}, {{0,+1}}, 0, 1}, {{{0,0,0,1}}, {{-1,+1}}, {{+1,0}}, {{0,+1}}, 0, 1}, // Top-left corner. {{{1,0,0,0}}, {{-1,-1}}, {{ 0,+1}}, {{-1, 0}}, 0, 0}, {{{1,0,0,0}}, {{-1,-1}}, {{ 0,+1}}, {{+1, 0}}, 1, 0}, {{{1,0,0,0}}, {{-1,-1}}, {{+1, 0}}, {{ 0,+1}}, 1, 0}, {{{1,0,0,0}}, {{-1,-1}}, {{+1, 0}}, {{ 0,-1}}, 0, 0}, {{{1,0,0,0}}, {{-1,-1}}, {{+kOctoOffset,0}}, {{-1,-1}}, 0, 0}, {{{1,0,0,0}}, {{-1,-1}}, {{0,+kOctoOffset}}, {{-1,-1}}, 0, 0}, // Top-right corner. {{{0,1,0,0}}, {{+1,-1}}, {{-1, 0}}, {{ 0,-1}}, 0, 0}, {{{0,1,0,0}}, {{+1,-1}}, {{-1, 0}}, {{ 0,+1}}, 1, 0}, {{{0,1,0,0}}, {{+1,-1}}, {{ 0,+1}}, {{-1, 0}}, 1, 0}, {{{0,1,0,0}}, {{+1,-1}}, {{ 0,+1}}, {{+1, 0}}, 0, 0}, {{{0,1,0,0}}, {{+1,-1}}, {{0,+kOctoOffset}}, {{+1,-1}}, 0, 0}, {{{0,1,0,0}}, {{+1,-1}}, {{-kOctoOffset,0}}, {{+1,-1}}, 0, 0}, // Bottom-right corner. {{{0,0,1,0}}, {{+1,+1}}, {{ 0,-1}}, {{+1, 0}}, 0, 0}, {{{0,0,1,0}}, {{+1,+1}}, {{ 0,-1}}, {{-1, 0}}, 1, 0}, {{{0,0,1,0}}, {{+1,+1}}, {{-1, 0}}, {{ 0,-1}}, 1, 0}, {{{0,0,1,0}}, {{+1,+1}}, {{-1, 0}}, {{ 0,+1}}, 0, 0}, {{{0,0,1,0}}, {{+1,+1}}, {{-kOctoOffset,0}}, {{+1,+1}}, 0, 0}, {{{0,0,1,0}}, {{+1,+1}}, {{0,-kOctoOffset}}, {{+1,+1}}, 0, 0}, // Bottom-left corner. {{{0,0,0,1}}, {{-1,+1}}, {{+1, 0}}, {{ 0,+1}}, 0, 0}, {{{0,0,0,1}}, {{-1,+1}}, {{+1, 0}}, {{ 0,-1}}, 1, 0}, {{{0,0,0,1}}, {{-1,+1}}, {{ 0,-1}}, {{+1, 0}}, 1, 0}, {{{0,0,0,1}}, {{-1,+1}}, {{ 0,-1}}, {{-1, 0}}, 0, 0}, {{{0,0,0,1}}, {{-1,+1}}, {{0,-kOctoOffset}}, {{-1,+1}}, 0, 0}, {{{0,0,0,1}}, {{-1,+1}}, {{+kOctoOffset,0}}, {{-1,+1}}, 0, 0}}; SKGPU_DECLARE_STATIC_UNIQUE_KEY(gVertexBufferKey); static constexpr uint16_t kIndexData[] = { // Inset octagon (solid coverage). 0, 1, 7, 1, 2, 7, 7, 2, 6, 2, 3, 6, 6, 3, 5, 3, 4, 5, // AA borders (linear coverage). 0, 1, 8, 1, 9, 8, 2, 3, 10, 3, 11, 10, 4, 5, 12, 5, 13, 12, 6, 7, 14, 7, 15, 14, // Top-left arc. 16, 17, 21, 17, 21, 18, 21, 18, 20, 18, 20, 19, // Top-right arc. 22, 23, 27, 23, 27, 24, 27, 24, 26, 24, 26, 25, // Bottom-right arc. 28, 29, 33, 29, 33, 30, 33, 30, 32, 30, 32, 31, // Bottom-left arc. 34, 35, 39, 35, 39, 36, 39, 36, 38, 36, 38, 37}; SKGPU_DECLARE_STATIC_UNIQUE_KEY(gIndexBufferKey); void FillRRectOpImpl::onPrepareDraws(GrMeshDrawTarget* target) { if (!fProgramInfo) { this->createProgramInfo(target); } size_t instanceStride = fProgramInfo->geomProc().instanceStride(); if (VertexWriter instanceWriter = target->makeVertexWriter(instanceStride, fInstanceCount, &fInstanceBuffer, &fBaseInstance)) { SkDEBUGCODE(auto end = instanceWriter.mark(instanceStride * fInstanceCount)); for (Instance* i = fHeadInstance; i; i = i->fNext) { auto [l, t, r, b] = i->fRRect.rect(); // Produce a matrix that draws the round rect from normalized [-1, -1, +1, +1] space. SkMatrix m; // Unmap the normalized rect [-1, -1, +1, +1] back to [l, t, r, b]. m.setScaleTranslate((r - l)/2, (b - t)/2, (l + r)/2, (t + b)/2); // Map to device space. m.postConcat(i->fViewMatrix); // Convert the radii to [-1, -1, +1, +1] space and write their attribs. skvx::float4 radiiX, radiiY; skvx::strided_load2(&SkRRectPriv::GetRadiiArray(i->fRRect)->fX, radiiX, radiiY); radiiX *= 2 / (r - l); radiiY *= 2 / (b - t); instanceWriter << radiiX << radiiY << m.getScaleX() << m.getSkewX() << m.getSkewY() << m.getScaleY() << m.getTranslateX() << m.getTranslateY(); if (fProcessorFlags & ProcessorFlags::kHasLocalCoords) { if (i->fLocalCoords.fType == LocalCoords::Type::kRect) { instanceWriter << 0.f << 0.f // localrotate << i->fLocalCoords.fRect; // localrect } else { SkASSERT(i->fLocalCoords.fType == LocalCoords::Type::kMatrix); const SkRect& bounds = i->fRRect.rect(); const SkMatrix& localMatrix = i->fLocalCoords.fMatrix; SkVector u = localMatrix.mapVector(bounds.right() - bounds.left(), 0); SkVector v = localMatrix.mapVector(0, bounds.bottom() - bounds.top()); SkPoint l0 = localMatrix.mapPoint({bounds.left(), bounds.top()}); instanceWriter << v.x() << u.y() // localrotate << l0 << (l0.x() + u.x()) << (l0.y() + v.y()); // localrect } } instanceWriter << VertexColor(i->fColor, fProcessorFlags & ProcessorFlags::kWideColor); } SkASSERT(instanceWriter.mark() == end); } SKGPU_DEFINE_STATIC_UNIQUE_KEY(gIndexBufferKey); fIndexBuffer = target->resourceProvider()->findOrMakeStaticBuffer(GrGpuBufferType::kIndex, sizeof(kIndexData), kIndexData, gIndexBufferKey); SKGPU_DEFINE_STATIC_UNIQUE_KEY(gVertexBufferKey); fVertexBuffer = target->resourceProvider()->findOrMakeStaticBuffer(GrGpuBufferType::kVertex, sizeof(kVertexData), kVertexData, gVertexBufferKey); } class FillRRectOpImpl::Processor::Impl : public ProgramImpl { public: void setData(const GrGLSLProgramDataManager&, const GrShaderCaps&, const GrGeometryProcessor&) override {} private: void onEmitCode(EmitArgs& args, GrGPArgs* gpArgs) override { GrGLSLVertexBuilder* v = args.fVertBuilder; GrGLSLFPFragmentBuilder* f = args.fFragBuilder; const auto& proc = args.fGeomProc.cast(); bool useHWDerivatives = (proc.fFlags & ProcessorFlags::kUseHWDerivatives); SkASSERT(proc.vertexStride() == sizeof(CoverageVertex)); GrGLSLVaryingHandler* varyings = args.fVaryingHandler; varyings->emitAttributes(proc); f->codeAppendf("half4 %s;", args.fOutputColor); varyings->addPassThroughAttribute(proc.fColorAttrib->asShaderVar(), args.fOutputColor, GrGLSLVaryingHandler::Interpolation::kCanBeFlat); // Emit the vertex shader. // When MSAA is enabled, we need to make sure every sample gets lit up on pixels that have // fractional coverage. We do this by making the ramp wider. v->codeAppendf("float aa_bloat_multiplier = %i;", (proc.fFlags & ProcessorFlags::kMSAAEnabled) ? 2 // Outset an entire pixel (2 radii). : (!(proc.fFlags & ProcessorFlags::kFakeNonAA)) ? 1 // Outset one half pixel (1 radius). : 0); // No AA bloat. // Unpack vertex attribs. v->codeAppend("float2 corner = corner_and_radius_outsets.xy;"); v->codeAppend("float2 radius_outset = corner_and_radius_outsets.zw;"); v->codeAppend("float2 aa_bloat_direction = aa_bloat_and_coverage.xy;"); v->codeAppend("float is_linear_coverage = aa_bloat_and_coverage.w;"); // Find the amount to bloat each edge for AA (in source space). v->codeAppend("float2 pixellength = inversesqrt(" "float2(dot(skew.xz, skew.xz), dot(skew.yw, skew.yw)));"); v->codeAppend("float4 normalized_axis_dirs = skew * pixellength.xyxy;"); v->codeAppend("float2 axiswidths = (abs(normalized_axis_dirs.xy) + " "abs(normalized_axis_dirs.zw));"); v->codeAppend("float2 aa_bloatradius = axiswidths * pixellength * .5;"); // Identify our radii. v->codeAppend("float4 radii_and_neighbors = radii_selector" "* float4x4(radii_x, radii_y, radii_x.yxwz, radii_y.wzyx);"); v->codeAppend("float2 radii = radii_and_neighbors.xy;"); v->codeAppend("float2 neighbor_radii = radii_and_neighbors.zw;"); v->codeAppend("float coverage_multiplier = 1;"); v->codeAppend("if (any(greaterThan(aa_bloatradius, float2(1)))) {"); // The rrect is more narrow than a half-pixel AA coverage ramp. We can't // draw as-is or else opposite AA borders will overlap. Instead, fudge the // size up to the width of a coverage ramp, and then reduce total coverage // to make the rect appear more thin. v->codeAppend( "corner = max(abs(corner), aa_bloatradius) * sign(corner);"); v->codeAppend( "coverage_multiplier = 1 / (max(aa_bloatradius.x, 1) * " "max(aa_bloatradius.y, 1));"); // Set radii to zero to ensure we take the "linear coverage" codepath. // (The "coverage" variable only has effect in the linear codepath.) v->codeAppend( "radii = float2(0);"); v->codeAppend("}"); // Unpack coverage. v->codeAppend("float coverage = aa_bloat_and_coverage.z;"); if (proc.fFlags & ProcessorFlags::kMSAAEnabled) { // MSAA has a wider ramp that goes from -.5 to 1.5 instead of 0 to 1. v->codeAppendf("coverage = (coverage - .5) * aa_bloat_multiplier + .5;"); } v->codeAppend("if (any(lessThan(radii, aa_bloatradius * 1.5))) {"); // The radii are very small. Demote this arc to a sharp 90 degree corner. v->codeAppend( "radii = float2(0);"); // Convert to a standard picture frame for an AA rect instead of the round // rect geometry. v->codeAppend( "aa_bloat_direction = sign(corner);"); v->codeAppend( "if (coverage > .5) {"); // Are we an inset edge? v->codeAppend( "aa_bloat_direction = -aa_bloat_direction;"); v->codeAppend( "}"); v->codeAppend( "is_linear_coverage = 1;"); v->codeAppend("} else {"); // Don't let radii get smaller than a coverage ramp plus an extra half // pixel for MSAA. Always use the same amount so we don't pop when // switching between MSAA and coverage. v->codeAppend( "radii = clamp(radii, pixellength * 1.5, 2 - pixellength * 1.5);"); v->codeAppend( "neighbor_radii = clamp(neighbor_radii, pixellength * 1.5, " "2 - pixellength * 1.5);"); // Don't let neighboring radii get closer together than 1/16 pixel. v->codeAppend( "float2 spacing = 2 - radii - neighbor_radii;"); v->codeAppend( "float2 extra_pad = max(pixellength * .0625 - spacing, float2(0));"); v->codeAppend( "radii -= extra_pad * .5;"); v->codeAppend("}"); // Find our vertex position, adjusted for radii and bloated for AA. Our rect is drawn in // normalized [-1,-1,+1,+1] space. v->codeAppend("float2 aa_outset = " "aa_bloat_direction * aa_bloatradius * aa_bloat_multiplier;"); v->codeAppend("float2 vertexpos = corner + radius_outset * radii + aa_outset;"); v->codeAppend("if (coverage > .5) {"); // Are we an inset edge? // Don't allow the aa insets to overlap. i.e., Don't let them inset past // the center (x=y=0). Since we don't allow the rect to become thinner // than 1px, this should only happen when using MSAA, where we inset by an // entire pixel instead of half. v->codeAppend( "if (aa_bloat_direction.x != 0 && vertexpos.x * corner.x < 0) {"); v->codeAppend( "float backset = abs(vertexpos.x);"); v->codeAppend( "vertexpos.x = 0;"); v->codeAppend( "vertexpos.y += " "backset * sign(corner.y) * pixellength.y/pixellength.x;"); v->codeAppend( "coverage = (coverage - .5) * abs(corner.x) / " "(abs(corner.x) + backset) + .5;"); v->codeAppend( "}"); v->codeAppend( "if (aa_bloat_direction.y != 0 && vertexpos.y * corner.y < 0) {"); v->codeAppend( "float backset = abs(vertexpos.y);"); v->codeAppend( "vertexpos.y = 0;"); v->codeAppend( "vertexpos.x += " "backset * sign(corner.x) * pixellength.x/pixellength.y;"); v->codeAppend( "coverage = (coverage - .5) * abs(corner.y) / " "(abs(corner.y) + backset) + .5;"); v->codeAppend( "}"); v->codeAppend("}"); // Transform to device space. v->codeAppend("float2x2 skewmatrix = float2x2(skew.xy, skew.zw);"); v->codeAppend("float2 devcoord = vertexpos * skewmatrix + translate_and_localrotate.xy;"); gpArgs->fPositionVar.set(SkSLType::kFloat2, "devcoord"); // Output local coordinates. if (proc.fFlags & ProcessorFlags::kHasLocalCoords) { // Do math in a way that preserves exact local coord boundaries when there is no local // rotate and vertexpos is on an exact shape boundary. v->codeAppend("float2 T = vertexpos * .5 + .5;"); v->codeAppend("float2 localcoord = localrect.xy * (1 - T) + " "localrect.zw * T + " "translate_and_localrotate.zw * T.yx;"); gpArgs->fLocalCoordVar.set(SkSLType::kFloat2, "localcoord"); } // Setup interpolants for coverage. GrGLSLVarying arcCoord(useHWDerivatives ? SkSLType::kFloat2 : SkSLType::kFloat4); varyings->addVarying("arccoord", &arcCoord); v->codeAppend("if (0 != is_linear_coverage) {"); // We are a non-corner piece: Set x=0 to indicate built-in coverage, and // interpolate linear coverage across y. v->codeAppendf( "%s.xy = float2(0, coverage * coverage_multiplier);", arcCoord.vsOut()); v->codeAppend("} else {"); // Find the normalized arc coordinates for our corner ellipse. // (i.e., the coordinate system where x^2 + y^2 == 1). v->codeAppend( "float2 arccoord = 1 - abs(radius_outset) + aa_outset/radii * corner;"); // We are a corner piece: Interpolate the arc coordinates for coverage. // Emit x+1 to ensure no pixel in the arc has a x value of 0 (since x=0 // instructs the fragment shader to use linear coverage). v->codeAppendf( "%s.xy = float2(arccoord.x+1, arccoord.y);", arcCoord.vsOut()); if (!useHWDerivatives) { // The gradient is order-1: Interpolate it across arccoord.zw. v->codeAppendf("float2x2 derivatives = inverse(skewmatrix);"); v->codeAppendf("%s.zw = derivatives * (arccoord/radii * 2);", arcCoord.vsOut()); } v->codeAppend("}"); // Emit the fragment shader. f->codeAppendf("float x_plus_1=%s.x, y=%s.y;", arcCoord.fsIn(), arcCoord.fsIn()); f->codeAppendf("half coverage;"); f->codeAppendf("if (0 == x_plus_1) {"); f->codeAppendf( "coverage = half(y);"); // We are a non-arc pixel (linear coverage). f->codeAppendf("} else {"); f->codeAppendf( "float fn = x_plus_1 * (x_plus_1 - 2);"); // fn = (x+1)*(x-1) = x^2-1 f->codeAppendf( "fn = fma(y,y, fn);"); // fn = x^2 + y^2 - 1 if (useHWDerivatives) { f->codeAppendf("float fnwidth = fwidth(fn);"); } else { // The gradient is interpolated across arccoord.zw. f->codeAppendf("float gx=%s.z, gy=%s.w;", arcCoord.fsIn(), arcCoord.fsIn()); f->codeAppendf("float fnwidth = abs(gx) + abs(gy);"); } f->codeAppendf( "coverage = .5 - half(fn/fnwidth);"); if (proc.fFlags & ProcessorFlags::kMSAAEnabled) { // MSAA uses ramps larger than 1px, so we need to clamp in both branches. f->codeAppendf("}"); } f->codeAppendf("coverage = clamp(coverage, 0, 1);"); if (!(proc.fFlags & ProcessorFlags::kMSAAEnabled)) { // When not using MSAA, we only need to clamp in the "arc" branch. f->codeAppendf("}"); } if (proc.fFlags & ProcessorFlags::kFakeNonAA) { f->codeAppendf("coverage = (coverage >= .5) ? 1 : 0;"); } f->codeAppendf("half4 %s = half4(coverage);", args.fOutputCoverage); } }; std::unique_ptr FillRRectOpImpl::Processor::makeProgramImpl( const GrShaderCaps&) const { return std::make_unique(); } void FillRRectOpImpl::onCreateProgramInfo(const GrCaps* caps, SkArenaAlloc* arena, const GrSurfaceProxyView& writeView, bool usesMSAASurface, GrAppliedClip&& appliedClip, const GrDstProxyView& dstProxyView, GrXferBarrierFlags renderPassXferBarriers, GrLoadOp colorLoadOp) { if (usesMSAASurface) { fProcessorFlags |= ProcessorFlags::kMSAAEnabled; } GrGeometryProcessor* gp = Processor::Make(arena, fHelper.aaType(), fProcessorFlags); fProgramInfo = fHelper.createProgramInfo(caps, arena, writeView, usesMSAASurface, std::move(appliedClip), dstProxyView, gp, GrPrimitiveType::kTriangles, renderPassXferBarriers, colorLoadOp); } void FillRRectOpImpl::onExecute(GrOpFlushState* flushState, const SkRect& chainBounds) { if (!fInstanceBuffer || !fIndexBuffer || !fVertexBuffer) { return; // Setup failed. } flushState->bindPipelineAndScissorClip(*fProgramInfo, this->bounds()); flushState->bindTextures(fProgramInfo->geomProc(), nullptr, fProgramInfo->pipeline()); flushState->bindBuffers(std::move(fIndexBuffer), std::move(fInstanceBuffer), std::move(fVertexBuffer)); flushState->drawIndexedInstanced(std::size(kIndexData), 0, fInstanceCount, fBaseInstance, 0); } // Will the given corner look good if we use HW derivatives? bool can_use_hw_derivatives_with_coverage(const skvx::float2& devScale, const skvx::float2& cornerRadii) { skvx::float2 devRadii = devScale * cornerRadii; if (devRadii[1] < devRadii[0]) { devRadii = skvx::shuffle<1,0>(devRadii); } float minDevRadius = std::max(devRadii[0], 1.f); // Shader clamps radius at a minimum of 1. // Is the gradient smooth enough for this corner look ok if we use hardware derivatives? // This threshold was arrived at subjevtively on an NVIDIA chip. return minDevRadius * minDevRadius * 5 > devRadii[1]; } bool can_use_hw_derivatives_with_coverage(const skvx::float2& devScale, const SkVector& cornerRadii) { return can_use_hw_derivatives_with_coverage(devScale, skvx::float2::Load(&cornerRadii)); } // Will the given round rect look good if we use HW derivatives? bool can_use_hw_derivatives_with_coverage(const GrShaderCaps& shaderCaps, const SkMatrix& viewMatrix, const SkRRect& rrect) { if (!shaderCaps.fShaderDerivativeSupport) { return false; } auto x = skvx::float2(viewMatrix.getScaleX(), viewMatrix.getSkewX()); auto y = skvx::float2(viewMatrix.getSkewY(), viewMatrix.getScaleY()); skvx::float2 devScale = sqrt(x*x + y*y); switch (rrect.getType()) { case SkRRect::kEmpty_Type: case SkRRect::kRect_Type: return true; case SkRRect::kOval_Type: case SkRRect::kSimple_Type: return can_use_hw_derivatives_with_coverage(devScale, rrect.getSimpleRadii()); case SkRRect::kNinePatch_Type: { skvx::float2 r0 = skvx::float2::Load(SkRRectPriv::GetRadiiArray(rrect)); skvx::float2 r1 = skvx::float2::Load(SkRRectPriv::GetRadiiArray(rrect) + 2); skvx::float2 minRadii = min(r0, r1); skvx::float2 maxRadii = max(r0, r1); return can_use_hw_derivatives_with_coverage(devScale, skvx::float2(minRadii[0], maxRadii[1])) && can_use_hw_derivatives_with_coverage(devScale, skvx::float2(maxRadii[0], minRadii[1])); } case SkRRect::kComplex_Type: { for (int i = 0; i < 4; ++i) { auto corner = static_cast(i); if (!can_use_hw_derivatives_with_coverage(devScale, rrect.radii(corner))) { return false; } } return true; } } SK_ABORT("Invalid round rect type."); } } // anonymous namespace GrOp::Owner Make(GrRecordingContext* ctx, SkArenaAlloc* arena, GrPaint&& paint, const SkMatrix& viewMatrix, const SkRRect& rrect, const SkRect& localRect, GrAA aa) { return FillRRectOpImpl::Make(ctx, arena, std::move(paint), viewMatrix, rrect, localRect, aa); } GrOp::Owner Make(GrRecordingContext* ctx, SkArenaAlloc* arena, GrPaint&& paint, const SkMatrix& viewMatrix, const SkRRect& rrect, const SkMatrix& localMatrix, GrAA aa) { return FillRRectOpImpl::Make(ctx, arena, std::move(paint), viewMatrix, rrect, localMatrix, aa); } } // namespace skgpu::ganesh::FillRRectOp #if defined(GPU_TEST_UTILS) GR_DRAW_OP_TEST_DEFINE(FillRRectOp) { SkArenaAlloc arena(64 * sizeof(float)); SkMatrix viewMatrix = GrTest::TestMatrix(random); GrAA aa = GrAA(random->nextBool()); SkRect rect = GrTest::TestRect(random); float w = rect.width(); float h = rect.height(); SkRRect rrect; // TODO: test out other rrect configurations rrect.setNinePatch(rect, w / 3.0f, h / 4.0f, w / 5.0f, h / 6.0); return skgpu::ganesh::FillRRectOp::Make( context, &arena, std::move(paint), viewMatrix, rrect, rrect.rect(), aa); } #endif