blob: cc4b4a822898190e42927c9429cd2553dbcffb74 [file] [log] [blame]
/*
* Copyright 2018 Google Inc.
*
* Use of this source code is governed by a BSD-style license that can be
* found in the LICENSE file.
*/
#include "src/gpu/ganesh/ops/FillRRectOp.h"
#include "include/gpu/GrRecordingContext.h"
#include "include/private/SkVx.h"
#include "src/core/SkRRectPriv.h"
#include "src/gpu/BufferWriter.h"
#include "src/gpu/KeyBuilder.h"
#include "src/gpu/ganesh/GrCaps.h"
#include "src/gpu/ganesh/GrGeometryProcessor.h"
#include "src/gpu/ganesh/GrMemoryPool.h"
#include "src/gpu/ganesh/GrOpFlushState.h"
#include "src/gpu/ganesh/GrOpsRenderPass.h"
#include "src/gpu/ganesh/GrProgramInfo.h"
#include "src/gpu/ganesh/GrRecordingContextPriv.h"
#include "src/gpu/ganesh/GrResourceProvider.h"
#include "src/gpu/ganesh/geometry/GrShape.h"
#include "src/gpu/ganesh/glsl/GrGLSLFragmentShaderBuilder.h"
#include "src/gpu/ganesh/glsl/GrGLSLVarying.h"
#include "src/gpu/ganesh/glsl/GrGLSLVertexGeoBuilder.h"
#include "src/gpu/ganesh/ops/GrMeshDrawOp.h"
#include "src/gpu/ganesh/ops/GrSimpleMeshDrawOpHelper.h"
namespace skgpu::v1::FillRRectOp {
namespace {
class FillRRectOpImpl final : public GrMeshDrawOp {
private:
using Helper = GrSimpleMeshDrawOpHelper;
public:
DEFINE_OP_CLASS_ID
struct LocalCoords {
enum class Type : bool { kRect, kMatrix };
LocalCoords(const SkRect& localRect)
: fType(Type::kRect)
, fRect(localRect) {}
LocalCoords(const SkMatrix& localMatrix)
: fType(Type::kMatrix)
, fMatrix(localMatrix) {}
Type fType;
union {
SkRect fRect;
SkMatrix fMatrix;
};
};
static GrOp::Owner Make(GrRecordingContext*,
SkArenaAlloc*,
GrPaint&&,
const SkMatrix& viewMatrix,
const SkRRect&,
const LocalCoords&,
GrAA);
const char* name() const override { return "FillRRectOp"; }
FixedFunctionFlags fixedFunctionFlags() const override { return fHelper.fixedFunctionFlags(); }
ClipResult clipToShape(skgpu::v1::SurfaceDrawContext*,
SkClipOp,
const SkMatrix& clipMatrix,
const GrShape&,
GrAA) override;
GrProcessorSet::Analysis finalize(const GrCaps&, const GrAppliedClip*, GrClampType) override;
CombineResult onCombineIfPossible(GrOp*, SkArenaAlloc*, const GrCaps&) override;
void visitProxies(const GrVisitProxyFunc& func) const override {
if (fProgramInfo) {
fProgramInfo->visitFPProxies(func);
} else {
fHelper.visitProxies(func);
}
}
void onPrepareDraws(GrMeshDrawTarget*) override;
void onExecute(GrOpFlushState*, const SkRect& chainBounds) override;
private:
friend class ::GrSimpleMeshDrawOpHelper; // for access to ctor
friend class ::GrOp; // for access to ctor
enum class ProcessorFlags {
kNone = 0,
kUseHWDerivatives = 1 << 0,
kHasLocalCoords = 1 << 1,
kWideColor = 1 << 2,
kMSAAEnabled = 1 << 3,
kFakeNonAA = 1 << 4,
};
constexpr static int kNumProcessorFlags = 5;
GR_DECL_BITFIELD_CLASS_OPS_FRIENDS(ProcessorFlags);
class Processor;
FillRRectOpImpl(GrProcessorSet*,
const SkPMColor4f& paintColor,
SkArenaAlloc*,
const SkMatrix& viewMatrix,
const SkRRect&,
const LocalCoords&,
ProcessorFlags);
GrProgramInfo* programInfo() override { return fProgramInfo; }
// Create a GrProgramInfo object in the provided arena
void onCreateProgramInfo(const GrCaps*,
SkArenaAlloc*,
const GrSurfaceProxyView& writeView,
bool usesMSAASurface,
GrAppliedClip&&,
const GrDstProxyView&,
GrXferBarrierFlags renderPassXferBarriers,
GrLoadOp colorLoadOp) override;
Helper fHelper;
ProcessorFlags fProcessorFlags;
struct Instance {
Instance(const SkMatrix& viewMatrix,
const SkRRect& rrect,
const LocalCoords& localCoords,
const SkPMColor4f& color)
: fViewMatrix(viewMatrix), fRRect(rrect), fLocalCoords(localCoords), fColor(color) {
}
SkMatrix fViewMatrix;
SkRRect fRRect;
LocalCoords fLocalCoords;
SkPMColor4f fColor;
Instance* fNext = nullptr;
};
Instance* fHeadInstance;
Instance** fTailInstance;
int fInstanceCount = 1;
sk_sp<const GrBuffer> fInstanceBuffer;
sk_sp<const GrBuffer> fVertexBuffer;
sk_sp<const GrBuffer> fIndexBuffer;
int fBaseInstance = 0;
// If this op is prePrepared the created programInfo will be stored here for use in
// onExecute. In the prePrepared case it will have been stored in the record-time arena.
GrProgramInfo* fProgramInfo = nullptr;
};
GR_MAKE_BITFIELD_CLASS_OPS(FillRRectOpImpl::ProcessorFlags)
// Hardware derivatives are not always accurate enough for highly elliptical corners. This method
// checks to make sure the corners will still all look good if we use HW derivatives.
bool can_use_hw_derivatives_with_coverage(const GrShaderCaps&,
const SkMatrix&,
const SkRRect&);
GrOp::Owner FillRRectOpImpl::Make(GrRecordingContext* ctx,
SkArenaAlloc* arena,
GrPaint&& paint,
const SkMatrix& viewMatrix,
const SkRRect& rrect,
const LocalCoords& localCoords,
GrAA aa) {
const GrCaps* caps = ctx->priv().caps();
if (!caps->drawInstancedSupport()) {
return nullptr;
}
// We transform into a normalized -1..+1 space to draw the round rect. If the boundaries are too
// large, the math can overflow. The caller can fall back on path rendering if this is the case.
if (std::max(rrect.height(), rrect.width()) >= 1e6f) {
return nullptr;
}
ProcessorFlags flags = ProcessorFlags::kNone;
// TODO: Support perspective in a follow-on CL. This shouldn't be difficult, since we already
// use HW derivatives. The only trick will be adjusting the AA outset to account for
// perspective. (i.e., outset = 0.5 * z.)
if (viewMatrix.hasPerspective()) {
return nullptr;
}
if (can_use_hw_derivatives_with_coverage(*caps->shaderCaps(), viewMatrix, rrect)) {
// HW derivatives (more specifically, fwidth()) are consistently faster on all platforms in
// coverage mode. We use them as long as the approximation will be accurate enough.
flags |= ProcessorFlags::kUseHWDerivatives;
}
if (aa == GrAA::kNo) {
flags |= ProcessorFlags::kFakeNonAA;
}
return Helper::FactoryHelper<FillRRectOpImpl>(ctx, std::move(paint), arena, viewMatrix, rrect,
localCoords, flags);
}
FillRRectOpImpl::FillRRectOpImpl(GrProcessorSet* processorSet,
const SkPMColor4f& paintColor,
SkArenaAlloc* arena,
const SkMatrix& viewMatrix,
const SkRRect& rrect,
const LocalCoords& localCoords,
ProcessorFlags processorFlags)
: GrMeshDrawOp(ClassID())
, fHelper(processorSet,
(processorFlags & ProcessorFlags::kFakeNonAA)
? GrAAType::kNone
: GrAAType::kCoverage) // Use analytic AA even if the RT is MSAA.
, fProcessorFlags(processorFlags & ~(ProcessorFlags::kHasLocalCoords |
ProcessorFlags::kWideColor |
ProcessorFlags::kMSAAEnabled))
, fHeadInstance(arena->make<Instance>(viewMatrix, rrect, localCoords, paintColor))
, fTailInstance(&fHeadInstance->fNext) {
// FillRRectOp::Make fails if there is perspective.
SkASSERT(!viewMatrix.hasPerspective());
this->setBounds(viewMatrix.mapRect(rrect.getBounds()),
GrOp::HasAABloat(!(processorFlags & ProcessorFlags::kFakeNonAA)),
GrOp::IsHairline::kNo);
}
GrDrawOp::ClipResult FillRRectOpImpl::clipToShape(skgpu::v1::SurfaceDrawContext* sdc,
SkClipOp clipOp,
const SkMatrix& clipMatrix,
const GrShape& shape,
GrAA aa) {
SkASSERT(fInstanceCount == 1); // This needs to be called before combining.
SkASSERT(fHeadInstance->fNext == nullptr);
if ((shape.isRect() || shape.isRRect()) &&
clipOp == SkClipOp::kIntersect &&
(aa == GrAA::kNo) == (fProcessorFlags & ProcessorFlags::kFakeNonAA)) {
// The clip shape is a round rect. Attempt to map it to a round rect in "viewMatrix" space.
SkRRect clipRRect;
if (clipMatrix == fHeadInstance->fViewMatrix) {
if (shape.isRect()) {
clipRRect.setRect(shape.rect());
} else {
clipRRect = shape.rrect();
}
} else {
// Find a matrix that maps from "clipMatrix" space to "viewMatrix" space.
SkASSERT(!fHeadInstance->fViewMatrix.hasPerspective());
if (clipMatrix.hasPerspective()) {
return ClipResult::kFail;
}
SkMatrix clipToView;
if (!fHeadInstance->fViewMatrix.invert(&clipToView)) {
return ClipResult::kClippedOut;
}
clipToView.preConcat(clipMatrix);
SkASSERT(!clipToView.hasPerspective());
if (!SkScalarNearlyZero(clipToView.getSkewX()) ||
!SkScalarNearlyZero(clipToView.getSkewY())) {
// A rect in "clipMatrix" space is not a rect in "viewMatrix" space.
return ClipResult::kFail;
}
clipToView.setSkewX(0);
clipToView.setSkewY(0);
SkASSERT(clipToView.rectStaysRect());
if (shape.isRect()) {
clipRRect.setRect(clipToView.mapRect(shape.rect()));
} else {
if (!shape.rrect().transform(clipToView, &clipRRect)) {
// Transforming the rrect failed. This shouldn't generally happen except in
// cases of fp32 overflow.
return ClipResult::kFail;
}
}
}
// Intersect our round rect with the clip shape.
SkRRect isectRRect;
if (fHeadInstance->fRRect.isRect() && clipRRect.isRect()) {
SkRect isectRect;
if (!isectRect.intersect(fHeadInstance->fRRect.rect(), clipRRect.rect())) {
return ClipResult::kClippedOut;
}
isectRRect.setRect(isectRect);
} else {
isectRRect = SkRRectPriv::ConservativeIntersect(fHeadInstance->fRRect, clipRRect);
if (isectRRect.isEmpty()) {
// The round rects did not intersect at all or the intersection was too complicated
// to compute quickly.
return ClipResult::kFail;
}
}
// Don't apply the clip geometrically if it becomes subpixel, since then the hairline
// rendering may outset beyond the original clip.
SkRect devISectBounds = fHeadInstance->fViewMatrix.mapRect(isectRRect.rect());
if (devISectBounds.width() < 1.f || devISectBounds.height() < 1.f) {
return ClipResult::kFail;
}
if (fHeadInstance->fLocalCoords.fType == LocalCoords::Type::kRect) {
// Update the local rect.
auto rect = skvx::bit_pun<skvx::float4>(fHeadInstance->fRRect.rect());
auto local = skvx::bit_pun<skvx::float4>(fHeadInstance->fLocalCoords.fRect);
auto isect = skvx::bit_pun<skvx::float4>(isectRRect.rect());
auto rectToLocalSize = (local - skvx::shuffle<2,3,0,1>(local)) /
(rect - skvx::shuffle<2,3,0,1>(rect));
fHeadInstance->fLocalCoords.fRect =
skvx::bit_pun<SkRect>((isect - rect) * rectToLocalSize + local);
}
// Update the round rect.
fHeadInstance->fRRect = isectRRect;
return ClipResult::kClippedGeometrically;
}
return ClipResult::kFail;
}
GrProcessorSet::Analysis FillRRectOpImpl::finalize(const GrCaps& caps, const GrAppliedClip* clip,
GrClampType clampType) {
SkASSERT(fInstanceCount == 1);
SkASSERT(fHeadInstance->fNext == nullptr);
bool isWideColor;
auto analysis = fHelper.finalizeProcessors(caps, clip, clampType,
GrProcessorAnalysisCoverage::kSingleChannel,
&fHeadInstance->fColor, &isWideColor);
if (isWideColor) {
fProcessorFlags |= ProcessorFlags::kWideColor;
}
if (analysis.usesLocalCoords()) {
fProcessorFlags |= ProcessorFlags::kHasLocalCoords;
}
return analysis;
}
GrOp::CombineResult FillRRectOpImpl::onCombineIfPossible(GrOp* op,
SkArenaAlloc*,
const GrCaps& caps) {
auto that = op->cast<FillRRectOpImpl>();
if (!fHelper.isCompatible(that->fHelper, caps, this->bounds(), that->bounds()) ||
fProcessorFlags != that->fProcessorFlags) {
return CombineResult::kCannotCombine;
}
*fTailInstance = that->fHeadInstance;
fTailInstance = that->fTailInstance;
fInstanceCount += that->fInstanceCount;
return CombineResult::kMerged;
}
class FillRRectOpImpl::Processor final : public GrGeometryProcessor {
public:
static GrGeometryProcessor* Make(SkArenaAlloc* arena, GrAAType aaType, ProcessorFlags flags) {
return arena->make([&](void* ptr) {
return new (ptr) Processor(aaType, flags);
});
}
const char* name() const override { return "FillRRectOp::Processor"; }
void addToKey(const GrShaderCaps& caps, KeyBuilder* b) const override {
b->addBits(kNumProcessorFlags, (uint32_t)fFlags, "flags");
}
std::unique_ptr<ProgramImpl> makeProgramImpl(const GrShaderCaps&) const override;
private:
class Impl;
Processor(GrAAType aaType, ProcessorFlags flags)
: GrGeometryProcessor(kGrFillRRectOp_Processor_ClassID)
, fFlags(flags) {
this->setVertexAttributesWithImplicitOffsets(kVertexAttribs, std::size(kVertexAttribs));
fInstanceAttribs.emplace_back("radii_x", kFloat4_GrVertexAttribType, SkSLType::kFloat4);
fInstanceAttribs.emplace_back("radii_y", kFloat4_GrVertexAttribType, SkSLType::kFloat4);
fInstanceAttribs.emplace_back("skew", kFloat4_GrVertexAttribType, SkSLType::kFloat4);
if (fFlags & ProcessorFlags::kHasLocalCoords) {
fInstanceAttribs.emplace_back("translate_and_localrotate",
kFloat4_GrVertexAttribType,
SkSLType::kFloat4);
fInstanceAttribs.emplace_back(
"localrect", kFloat4_GrVertexAttribType, SkSLType::kFloat4);
} else {
fInstanceAttribs.emplace_back("translate_and_localrotate",
kFloat2_GrVertexAttribType,
SkSLType::kFloat2);
}
fColorAttrib = &fInstanceAttribs.push_back(
MakeColorAttribute("color", (fFlags & ProcessorFlags::kWideColor)));
SkASSERT(fInstanceAttribs.count() <= kMaxInstanceAttribs);
this->setInstanceAttributesWithImplicitOffsets(fInstanceAttribs.begin(),
fInstanceAttribs.count());
}
inline static constexpr Attribute kVertexAttribs[] = {
{"radii_selector", kFloat4_GrVertexAttribType, SkSLType::kFloat4},
{"corner_and_radius_outsets", kFloat4_GrVertexAttribType, SkSLType::kFloat4},
// Coverage only.
{"aa_bloat_and_coverage", kFloat4_GrVertexAttribType, SkSLType::kFloat4}};
const ProcessorFlags fFlags;
constexpr static int kMaxInstanceAttribs = 6;
SkSTArray<kMaxInstanceAttribs, Attribute> fInstanceAttribs;
const Attribute* fColorAttrib;
};
// Our coverage geometry consists of an inset octagon with solid coverage, surrounded by linear
// coverage ramps on the horizontal and vertical edges, and "arc coverage" pieces on the diagonal
// edges. The Vertex struct tells the shader where to place its vertex within a normalized
// ([l, t, r, b] = [-1, -1, +1, +1]) space, and how to calculate coverage. See onEmitCode.
struct CoverageVertex {
std::array<float, 4> fRadiiSelector;
std::array<float, 2> fCorner;
std::array<float, 2> fRadiusOutset;
std::array<float, 2> fAABloatDirection;
float fCoverage;
float fIsLinearCoverage;
};
// This is the offset (when multiplied by radii) from the corners of a bounding box to the vertices
// of its inscribed octagon. We draw the outside portion of arcs with quarter-octagons rather than
// rectangles.
static constexpr float kOctoOffset = 1/(1 + SK_ScalarRoot2Over2);
static constexpr CoverageVertex kVertexData[] = {
// Left inset edge.
{{{0,0,0,1}}, {{-1,+1}}, {{0,-1}}, {{+1,0}}, 1, 1},
{{{1,0,0,0}}, {{-1,-1}}, {{0,+1}}, {{+1,0}}, 1, 1},
// Top inset edge.
{{{1,0,0,0}}, {{-1,-1}}, {{+1,0}}, {{0,+1}}, 1, 1},
{{{0,1,0,0}}, {{+1,-1}}, {{-1,0}}, {{0,+1}}, 1, 1},
// Right inset edge.
{{{0,1,0,0}}, {{+1,-1}}, {{0,+1}}, {{-1,0}}, 1, 1},
{{{0,0,1,0}}, {{+1,+1}}, {{0,-1}}, {{-1,0}}, 1, 1},
// Bottom inset edge.
{{{0,0,1,0}}, {{+1,+1}}, {{-1,0}}, {{0,-1}}, 1, 1},
{{{0,0,0,1}}, {{-1,+1}}, {{+1,0}}, {{0,-1}}, 1, 1},
// Left outset edge.
{{{0,0,0,1}}, {{-1,+1}}, {{0,-1}}, {{-1,0}}, 0, 1},
{{{1,0,0,0}}, {{-1,-1}}, {{0,+1}}, {{-1,0}}, 0, 1},
// Top outset edge.
{{{1,0,0,0}}, {{-1,-1}}, {{+1,0}}, {{0,-1}}, 0, 1},
{{{0,1,0,0}}, {{+1,-1}}, {{-1,0}}, {{0,-1}}, 0, 1},
// Right outset edge.
{{{0,1,0,0}}, {{+1,-1}}, {{0,+1}}, {{+1,0}}, 0, 1},
{{{0,0,1,0}}, {{+1,+1}}, {{0,-1}}, {{+1,0}}, 0, 1},
// Bottom outset edge.
{{{0,0,1,0}}, {{+1,+1}}, {{-1,0}}, {{0,+1}}, 0, 1},
{{{0,0,0,1}}, {{-1,+1}}, {{+1,0}}, {{0,+1}}, 0, 1},
// Top-left corner.
{{{1,0,0,0}}, {{-1,-1}}, {{ 0,+1}}, {{-1, 0}}, 0, 0},
{{{1,0,0,0}}, {{-1,-1}}, {{ 0,+1}}, {{+1, 0}}, 1, 0},
{{{1,0,0,0}}, {{-1,-1}}, {{+1, 0}}, {{ 0,+1}}, 1, 0},
{{{1,0,0,0}}, {{-1,-1}}, {{+1, 0}}, {{ 0,-1}}, 0, 0},
{{{1,0,0,0}}, {{-1,-1}}, {{+kOctoOffset,0}}, {{-1,-1}}, 0, 0},
{{{1,0,0,0}}, {{-1,-1}}, {{0,+kOctoOffset}}, {{-1,-1}}, 0, 0},
// Top-right corner.
{{{0,1,0,0}}, {{+1,-1}}, {{-1, 0}}, {{ 0,-1}}, 0, 0},
{{{0,1,0,0}}, {{+1,-1}}, {{-1, 0}}, {{ 0,+1}}, 1, 0},
{{{0,1,0,0}}, {{+1,-1}}, {{ 0,+1}}, {{-1, 0}}, 1, 0},
{{{0,1,0,0}}, {{+1,-1}}, {{ 0,+1}}, {{+1, 0}}, 0, 0},
{{{0,1,0,0}}, {{+1,-1}}, {{0,+kOctoOffset}}, {{+1,-1}}, 0, 0},
{{{0,1,0,0}}, {{+1,-1}}, {{-kOctoOffset,0}}, {{+1,-1}}, 0, 0},
// Bottom-right corner.
{{{0,0,1,0}}, {{+1,+1}}, {{ 0,-1}}, {{+1, 0}}, 0, 0},
{{{0,0,1,0}}, {{+1,+1}}, {{ 0,-1}}, {{-1, 0}}, 1, 0},
{{{0,0,1,0}}, {{+1,+1}}, {{-1, 0}}, {{ 0,-1}}, 1, 0},
{{{0,0,1,0}}, {{+1,+1}}, {{-1, 0}}, {{ 0,+1}}, 0, 0},
{{{0,0,1,0}}, {{+1,+1}}, {{-kOctoOffset,0}}, {{+1,+1}}, 0, 0},
{{{0,0,1,0}}, {{+1,+1}}, {{0,-kOctoOffset}}, {{+1,+1}}, 0, 0},
// Bottom-left corner.
{{{0,0,0,1}}, {{-1,+1}}, {{+1, 0}}, {{ 0,+1}}, 0, 0},
{{{0,0,0,1}}, {{-1,+1}}, {{+1, 0}}, {{ 0,-1}}, 1, 0},
{{{0,0,0,1}}, {{-1,+1}}, {{ 0,-1}}, {{+1, 0}}, 1, 0},
{{{0,0,0,1}}, {{-1,+1}}, {{ 0,-1}}, {{-1, 0}}, 0, 0},
{{{0,0,0,1}}, {{-1,+1}}, {{0,-kOctoOffset}}, {{-1,+1}}, 0, 0},
{{{0,0,0,1}}, {{-1,+1}}, {{+kOctoOffset,0}}, {{-1,+1}}, 0, 0}};
SKGPU_DECLARE_STATIC_UNIQUE_KEY(gVertexBufferKey);
static constexpr uint16_t kIndexData[] = {
// Inset octagon (solid coverage).
0, 1, 7,
1, 2, 7,
7, 2, 6,
2, 3, 6,
6, 3, 5,
3, 4, 5,
// AA borders (linear coverage).
0, 1, 8, 1, 9, 8,
2, 3, 10, 3, 11, 10,
4, 5, 12, 5, 13, 12,
6, 7, 14, 7, 15, 14,
// Top-left arc.
16, 17, 21,
17, 21, 18,
21, 18, 20,
18, 20, 19,
// Top-right arc.
22, 23, 27,
23, 27, 24,
27, 24, 26,
24, 26, 25,
// Bottom-right arc.
28, 29, 33,
29, 33, 30,
33, 30, 32,
30, 32, 31,
// Bottom-left arc.
34, 35, 39,
35, 39, 36,
39, 36, 38,
36, 38, 37};
SKGPU_DECLARE_STATIC_UNIQUE_KEY(gIndexBufferKey);
void FillRRectOpImpl::onPrepareDraws(GrMeshDrawTarget* target) {
if (!fProgramInfo) {
this->createProgramInfo(target);
}
size_t instanceStride = fProgramInfo->geomProc().instanceStride();
if (VertexWriter instanceWriter = target->makeVertexWriter(instanceStride, fInstanceCount,
&fInstanceBuffer, &fBaseInstance)) {
SkDEBUGCODE(auto end = instanceWriter.mark(instanceStride * fInstanceCount));
for (Instance* i = fHeadInstance; i; i = i->fNext) {
auto [l, t, r, b] = i->fRRect.rect();
// Produce a matrix that draws the round rect from normalized [-1, -1, +1, +1] space.
SkMatrix m;
// Unmap the normalized rect [-1, -1, +1, +1] back to [l, t, r, b].
m.setScaleTranslate((r - l)/2, (b - t)/2, (l + r)/2, (t + b)/2);
// Map to device space.
m.postConcat(i->fViewMatrix);
// Convert the radii to [-1, -1, +1, +1] space and write their attribs.
skvx::float4 radiiX, radiiY;
skvx::strided_load2(&SkRRectPriv::GetRadiiArray(i->fRRect)->fX, radiiX, radiiY);
radiiX *= 2 / (r - l);
radiiY *= 2 / (b - t);
instanceWriter << radiiX << radiiY
<< m.getScaleX() << m.getSkewX() << m.getSkewY() << m.getScaleY()
<< m.getTranslateX() << m.getTranslateY();
if (fProcessorFlags & ProcessorFlags::kHasLocalCoords) {
if (i->fLocalCoords.fType == LocalCoords::Type::kRect) {
instanceWriter << 0.f << 0.f // localrotate
<< i->fLocalCoords.fRect; // localrect
} else {
SkASSERT(i->fLocalCoords.fType == LocalCoords::Type::kMatrix);
const SkRect& bounds = i->fRRect.rect();
const SkMatrix& localMatrix = i->fLocalCoords.fMatrix;
SkVector u = localMatrix.mapVector(bounds.right() - bounds.left(), 0);
SkVector v = localMatrix.mapVector(0, bounds.bottom() - bounds.top());
SkPoint l0 = localMatrix.mapPoint({bounds.left(), bounds.top()});
instanceWriter << v.x() << u.y() // localrotate
<< l0 << (l0.x() + u.x()) << (l0.y() + v.y()); // localrect
}
}
instanceWriter << VertexColor(i->fColor, fProcessorFlags & ProcessorFlags::kWideColor);
}
SkASSERT(instanceWriter.mark() == end);
}
SKGPU_DEFINE_STATIC_UNIQUE_KEY(gIndexBufferKey);
fIndexBuffer = target->resourceProvider()->findOrMakeStaticBuffer(GrGpuBufferType::kIndex,
sizeof(kIndexData),
kIndexData, gIndexBufferKey);
SKGPU_DEFINE_STATIC_UNIQUE_KEY(gVertexBufferKey);
fVertexBuffer = target->resourceProvider()->findOrMakeStaticBuffer(GrGpuBufferType::kVertex,
sizeof(kVertexData),
kVertexData,
gVertexBufferKey);
}
class FillRRectOpImpl::Processor::Impl : public ProgramImpl {
public:
void setData(const GrGLSLProgramDataManager&,
const GrShaderCaps&,
const GrGeometryProcessor&) override {}
private:
void onEmitCode(EmitArgs& args, GrGPArgs* gpArgs) override {
GrGLSLVertexBuilder* v = args.fVertBuilder;
GrGLSLFPFragmentBuilder* f = args.fFragBuilder;
const auto& proc = args.fGeomProc.cast<Processor>();
bool useHWDerivatives = (proc.fFlags & ProcessorFlags::kUseHWDerivatives);
SkASSERT(proc.vertexStride() == sizeof(CoverageVertex));
GrGLSLVaryingHandler* varyings = args.fVaryingHandler;
varyings->emitAttributes(proc);
f->codeAppendf("half4 %s;", args.fOutputColor);
varyings->addPassThroughAttribute(proc.fColorAttrib->asShaderVar(),
args.fOutputColor,
GrGLSLVaryingHandler::Interpolation::kCanBeFlat);
// Emit the vertex shader.
// When MSAA is enabled, we need to make sure every sample gets lit up on pixels that have
// fractional coverage. We do this by making the ramp wider.
v->codeAppendf("float aa_bloat_multiplier = %i;",
(proc.fFlags & ProcessorFlags::kMSAAEnabled)
? 2 // Outset an entire pixel (2 radii).
: (!(proc.fFlags & ProcessorFlags::kFakeNonAA))
? 1 // Outset one half pixel (1 radius).
: 0); // No AA bloat.
// Unpack vertex attribs.
v->codeAppend("float2 corner = corner_and_radius_outsets.xy;");
v->codeAppend("float2 radius_outset = corner_and_radius_outsets.zw;");
v->codeAppend("float2 aa_bloat_direction = aa_bloat_and_coverage.xy;");
v->codeAppend("float is_linear_coverage = aa_bloat_and_coverage.w;");
// Find the amount to bloat each edge for AA (in source space).
v->codeAppend("float2 pixellength = inversesqrt("
"float2(dot(skew.xz, skew.xz), dot(skew.yw, skew.yw)));");
v->codeAppend("float4 normalized_axis_dirs = skew * pixellength.xyxy;");
v->codeAppend("float2 axiswidths = (abs(normalized_axis_dirs.xy) + "
"abs(normalized_axis_dirs.zw));");
v->codeAppend("float2 aa_bloatradius = axiswidths * pixellength * .5;");
// Identify our radii.
v->codeAppend("float4 radii_and_neighbors = radii_selector"
"* float4x4(radii_x, radii_y, radii_x.yxwz, radii_y.wzyx);");
v->codeAppend("float2 radii = radii_and_neighbors.xy;");
v->codeAppend("float2 neighbor_radii = radii_and_neighbors.zw;");
v->codeAppend("float coverage_multiplier = 1;");
v->codeAppend("if (any(greaterThan(aa_bloatradius, float2(1)))) {");
// The rrect is more narrow than a half-pixel AA coverage ramp. We can't
// draw as-is or else opposite AA borders will overlap. Instead, fudge the
// size up to the width of a coverage ramp, and then reduce total coverage
// to make the rect appear more thin.
v->codeAppend( "corner = max(abs(corner), aa_bloatradius) * sign(corner);");
v->codeAppend( "coverage_multiplier = 1 / (max(aa_bloatradius.x, 1) * "
"max(aa_bloatradius.y, 1));");
// Set radii to zero to ensure we take the "linear coverage" codepath.
// (The "coverage" variable only has effect in the linear codepath.)
v->codeAppend( "radii = float2(0);");
v->codeAppend("}");
// Unpack coverage.
v->codeAppend("float coverage = aa_bloat_and_coverage.z;");
if (proc.fFlags & ProcessorFlags::kMSAAEnabled) {
// MSAA has a wider ramp that goes from -.5 to 1.5 instead of 0 to 1.
v->codeAppendf("coverage = (coverage - .5) * aa_bloat_multiplier + .5;");
}
v->codeAppend("if (any(lessThan(radii, aa_bloatradius * 1.5))) {");
// The radii are very small. Demote this arc to a sharp 90 degree corner.
v->codeAppend( "radii = float2(0);");
// Convert to a standard picture frame for an AA rect instead of the round
// rect geometry.
v->codeAppend( "aa_bloat_direction = sign(corner);");
v->codeAppend( "if (coverage > .5) {"); // Are we an inset edge?
v->codeAppend( "aa_bloat_direction = -aa_bloat_direction;");
v->codeAppend( "}");
v->codeAppend( "is_linear_coverage = 1;");
v->codeAppend("} else {");
// Don't let radii get smaller than a coverage ramp plus an extra half
// pixel for MSAA. Always use the same amount so we don't pop when
// switching between MSAA and coverage.
v->codeAppend( "radii = clamp(radii, pixellength * 1.5, 2 - pixellength * 1.5);");
v->codeAppend( "neighbor_radii = clamp(neighbor_radii, pixellength * 1.5, "
"2 - pixellength * 1.5);");
// Don't let neighboring radii get closer together than 1/16 pixel.
v->codeAppend( "float2 spacing = 2 - radii - neighbor_radii;");
v->codeAppend( "float2 extra_pad = max(pixellength * .0625 - spacing, float2(0));");
v->codeAppend( "radii -= extra_pad * .5;");
v->codeAppend("}");
// Find our vertex position, adjusted for radii and bloated for AA. Our rect is drawn in
// normalized [-1,-1,+1,+1] space.
v->codeAppend("float2 aa_outset = "
"aa_bloat_direction * aa_bloatradius * aa_bloat_multiplier;");
v->codeAppend("float2 vertexpos = corner + radius_outset * radii + aa_outset;");
v->codeAppend("if (coverage > .5) {"); // Are we an inset edge?
// Don't allow the aa insets to overlap. i.e., Don't let them inset past
// the center (x=y=0). Since we don't allow the rect to become thinner
// than 1px, this should only happen when using MSAA, where we inset by an
// entire pixel instead of half.
v->codeAppend( "if (aa_bloat_direction.x != 0 && vertexpos.x * corner.x < 0) {");
v->codeAppend( "float backset = abs(vertexpos.x);");
v->codeAppend( "vertexpos.x = 0;");
v->codeAppend( "vertexpos.y += "
"backset * sign(corner.y) * pixellength.y/pixellength.x;");
v->codeAppend( "coverage = (coverage - .5) * abs(corner.x) / "
"(abs(corner.x) + backset) + .5;");
v->codeAppend( "}");
v->codeAppend( "if (aa_bloat_direction.y != 0 && vertexpos.y * corner.y < 0) {");
v->codeAppend( "float backset = abs(vertexpos.y);");
v->codeAppend( "vertexpos.y = 0;");
v->codeAppend( "vertexpos.x += "
"backset * sign(corner.x) * pixellength.x/pixellength.y;");
v->codeAppend( "coverage = (coverage - .5) * abs(corner.y) / "
"(abs(corner.y) + backset) + .5;");
v->codeAppend( "}");
v->codeAppend("}");
// Transform to device space.
v->codeAppend("float2x2 skewmatrix = float2x2(skew.xy, skew.zw);");
v->codeAppend("float2 devcoord = vertexpos * skewmatrix + translate_and_localrotate.xy;");
gpArgs->fPositionVar.set(SkSLType::kFloat2, "devcoord");
// Output local coordinates.
if (proc.fFlags & ProcessorFlags::kHasLocalCoords) {
// Do math in a way that preserves exact local coord boundaries when there is no local
// rotate and vertexpos is on an exact shape boundary.
v->codeAppend("float2 T = vertexpos * .5 + .5;");
v->codeAppend("float2 localcoord = localrect.xy * (1 - T) + "
"localrect.zw * T + "
"translate_and_localrotate.zw * T.yx;");
gpArgs->fLocalCoordVar.set(SkSLType::kFloat2, "localcoord");
}
// Setup interpolants for coverage.
GrGLSLVarying arcCoord(useHWDerivatives ? SkSLType::kFloat2 : SkSLType::kFloat4);
varyings->addVarying("arccoord", &arcCoord);
v->codeAppend("if (0 != is_linear_coverage) {");
// We are a non-corner piece: Set x=0 to indicate built-in coverage, and
// interpolate linear coverage across y.
v->codeAppendf( "%s.xy = float2(0, coverage * coverage_multiplier);",
arcCoord.vsOut());
v->codeAppend("} else {");
// Find the normalized arc coordinates for our corner ellipse.
// (i.e., the coordinate system where x^2 + y^2 == 1).
v->codeAppend( "float2 arccoord = 1 - abs(radius_outset) + aa_outset/radii * corner;");
// We are a corner piece: Interpolate the arc coordinates for coverage.
// Emit x+1 to ensure no pixel in the arc has a x value of 0 (since x=0
// instructs the fragment shader to use linear coverage).
v->codeAppendf( "%s.xy = float2(arccoord.x+1, arccoord.y);", arcCoord.vsOut());
if (!useHWDerivatives) {
// The gradient is order-1: Interpolate it across arccoord.zw.
v->codeAppendf("float2x2 derivatives = inverse(skewmatrix);");
v->codeAppendf("%s.zw = derivatives * (arccoord/radii * 2);", arcCoord.vsOut());
}
v->codeAppend("}");
// Emit the fragment shader.
f->codeAppendf("float x_plus_1=%s.x, y=%s.y;", arcCoord.fsIn(), arcCoord.fsIn());
f->codeAppendf("half coverage;");
f->codeAppendf("if (0 == x_plus_1) {");
f->codeAppendf( "coverage = half(y);"); // We are a non-arc pixel (linear coverage).
f->codeAppendf("} else {");
f->codeAppendf( "float fn = x_plus_1 * (x_plus_1 - 2);"); // fn = (x+1)*(x-1) = x^2-1
f->codeAppendf( "fn = fma(y,y, fn);"); // fn = x^2 + y^2 - 1
if (useHWDerivatives) {
f->codeAppendf("float fnwidth = fwidth(fn);");
} else {
// The gradient is interpolated across arccoord.zw.
f->codeAppendf("float gx=%s.z, gy=%s.w;", arcCoord.fsIn(), arcCoord.fsIn());
f->codeAppendf("float fnwidth = abs(gx) + abs(gy);");
}
f->codeAppendf( "coverage = .5 - half(fn/fnwidth);");
if (proc.fFlags & ProcessorFlags::kMSAAEnabled) {
// MSAA uses ramps larger than 1px, so we need to clamp in both branches.
f->codeAppendf("}");
}
f->codeAppendf("coverage = clamp(coverage, 0, 1);");
if (!(proc.fFlags & ProcessorFlags::kMSAAEnabled)) {
// When not using MSAA, we only need to clamp in the "arc" branch.
f->codeAppendf("}");
}
if (proc.fFlags & ProcessorFlags::kFakeNonAA) {
f->codeAppendf("coverage = (coverage >= .5) ? 1 : 0;");
}
f->codeAppendf("half4 %s = half4(coverage);", args.fOutputCoverage);
}
};
std::unique_ptr<GrGeometryProcessor::ProgramImpl> FillRRectOpImpl::Processor::makeProgramImpl(
const GrShaderCaps&) const {
return std::make_unique<Impl>();
}
void FillRRectOpImpl::onCreateProgramInfo(const GrCaps* caps,
SkArenaAlloc* arena,
const GrSurfaceProxyView& writeView,
bool usesMSAASurface,
GrAppliedClip&& appliedClip,
const GrDstProxyView& dstProxyView,
GrXferBarrierFlags renderPassXferBarriers,
GrLoadOp colorLoadOp) {
if (usesMSAASurface) {
fProcessorFlags |= ProcessorFlags::kMSAAEnabled;
}
GrGeometryProcessor* gp = Processor::Make(arena, fHelper.aaType(), fProcessorFlags);
fProgramInfo = fHelper.createProgramInfo(caps, arena, writeView, usesMSAASurface,
std::move(appliedClip), dstProxyView, gp,
GrPrimitiveType::kTriangles, renderPassXferBarriers,
colorLoadOp);
}
void FillRRectOpImpl::onExecute(GrOpFlushState* flushState, const SkRect& chainBounds) {
if (!fInstanceBuffer || !fIndexBuffer || !fVertexBuffer) {
return; // Setup failed.
}
flushState->bindPipelineAndScissorClip(*fProgramInfo, this->bounds());
flushState->bindTextures(fProgramInfo->geomProc(), nullptr, fProgramInfo->pipeline());
flushState->bindBuffers(std::move(fIndexBuffer), std::move(fInstanceBuffer),
std::move(fVertexBuffer));
flushState->drawIndexedInstanced(std::size(kIndexData), 0, fInstanceCount, fBaseInstance, 0);
}
// Will the given corner look good if we use HW derivatives?
bool can_use_hw_derivatives_with_coverage(const skvx::float2& devScale,
const skvx::float2& cornerRadii) {
skvx::float2 devRadii = devScale * cornerRadii;
if (devRadii[1] < devRadii[0]) {
devRadii = skvx::shuffle<1,0>(devRadii);
}
float minDevRadius = std::max(devRadii[0], 1.f); // Shader clamps radius at a minimum of 1.
// Is the gradient smooth enough for this corner look ok if we use hardware derivatives?
// This threshold was arrived at subjevtively on an NVIDIA chip.
return minDevRadius * minDevRadius * 5 > devRadii[1];
}
bool can_use_hw_derivatives_with_coverage(const skvx::float2& devScale,
const SkVector& cornerRadii) {
return can_use_hw_derivatives_with_coverage(devScale, skvx::float2::Load(&cornerRadii));
}
// Will the given round rect look good if we use HW derivatives?
bool can_use_hw_derivatives_with_coverage(const GrShaderCaps& shaderCaps,
const SkMatrix& viewMatrix,
const SkRRect& rrect) {
if (!shaderCaps.fShaderDerivativeSupport) {
return false;
}
auto x = skvx::float2(viewMatrix.getScaleX(), viewMatrix.getSkewX());
auto y = skvx::float2(viewMatrix.getSkewY(), viewMatrix.getScaleY());
skvx::float2 devScale = sqrt(x*x + y*y);
switch (rrect.getType()) {
case SkRRect::kEmpty_Type:
case SkRRect::kRect_Type:
return true;
case SkRRect::kOval_Type:
case SkRRect::kSimple_Type:
return can_use_hw_derivatives_with_coverage(devScale, rrect.getSimpleRadii());
case SkRRect::kNinePatch_Type: {
skvx::float2 r0 = skvx::float2::Load(SkRRectPriv::GetRadiiArray(rrect));
skvx::float2 r1 = skvx::float2::Load(SkRRectPriv::GetRadiiArray(rrect) + 2);
skvx::float2 minRadii = min(r0, r1);
skvx::float2 maxRadii = max(r0, r1);
return can_use_hw_derivatives_with_coverage(devScale,
skvx::float2(minRadii[0], maxRadii[1])) &&
can_use_hw_derivatives_with_coverage(devScale,
skvx::float2(maxRadii[0], minRadii[1]));
}
case SkRRect::kComplex_Type: {
for (int i = 0; i < 4; ++i) {
auto corner = static_cast<SkRRect::Corner>(i);
if (!can_use_hw_derivatives_with_coverage(devScale, rrect.radii(corner))) {
return false;
}
}
return true;
}
}
SK_ABORT("Invalid round rect type.");
}
} // anonymous namespace
GrOp::Owner Make(GrRecordingContext* ctx,
SkArenaAlloc* arena,
GrPaint&& paint,
const SkMatrix& viewMatrix,
const SkRRect& rrect,
const SkRect& localRect,
GrAA aa) {
return FillRRectOpImpl::Make(ctx, arena, std::move(paint), viewMatrix, rrect, localRect, aa);
}
GrOp::Owner Make(GrRecordingContext* ctx,
SkArenaAlloc* arena,
GrPaint&& paint,
const SkMatrix& viewMatrix,
const SkRRect& rrect,
const SkMatrix& localMatrix,
GrAA aa) {
return FillRRectOpImpl::Make(ctx, arena, std::move(paint), viewMatrix, rrect, localMatrix, aa);
}
} // namespace skgpu::v1::FillRRectOp
#if GR_TEST_UTILS
#include "src/gpu/ganesh/GrDrawOpTest.h"
GR_DRAW_OP_TEST_DEFINE(FillRRectOp) {
SkArenaAlloc arena(64 * sizeof(float));
SkMatrix viewMatrix = GrTest::TestMatrix(random);
GrAA aa = GrAA(random->nextBool());
SkRect rect = GrTest::TestRect(random);
float w = rect.width();
float h = rect.height();
SkRRect rrect;
// TODO: test out other rrect configurations
rrect.setNinePatch(rect, w / 3.0f, h / 4.0f, w / 5.0f, h / 6.0);
return skgpu::v1::FillRRectOp::Make(context,
&arena,
std::move(paint),
viewMatrix,
rrect,
rrect.rect(),
aa);
}
#endif