From ce5c525d7738e60afed06dae0281d859581f4ea5 Mon Sep 17 00:00:00 2001 From: jonahwilliams Date: Fri, 31 Mar 2023 16:51:56 -0700 Subject: [PATCH 1/2] [Impeller] take advantage of native decal sampling --- .../contents/filters/blend_filter_contents.cc | 25 +++++++++++------ .../contents/framebuffer_blend_contents.cc | 9 ++++++- .../shaders/blending/advanced_blend.glsl | 27 ++++++++++++------- impeller/entity/shaders/blending/blend.frag | 6 ++--- impeller/entity/shaders/blending/blend.vert | 5 +++- .../blending/ios/framebuffer_blend.glsl | 6 ++--- 6 files changed, 52 insertions(+), 26 deletions(-) diff --git a/impeller/entity/contents/filters/blend_filter_contents.cc b/impeller/entity/contents/filters/blend_filter_contents.cc index ec215482d605e..1548d80c82da3 100644 --- a/impeller/entity/contents/filters/blend_filter_contents.cc +++ b/impeller/entity/contents/filters/blend_filter_contents.cc @@ -118,8 +118,13 @@ static std::optional AdvancedBlend( typename FS::BlendInfo blend_info; typename VS::FrameInfo frame_info; + auto dst_sampler_descriptor = dst_snapshot->sampler_descriptor; + if (renderer.GetDeviceCapabilities().SupportsDecalTileMode()) { + dst_sampler_descriptor.width_address_mode = SamplerAddressMode::kDecal; + dst_sampler_descriptor.height_address_mode = SamplerAddressMode::kDecal; + } auto dst_sampler = renderer.GetContext()->GetSamplerLibrary()->GetSampler( - dst_snapshot->sampler_descriptor); + dst_sampler_descriptor); FS::BindTextureSamplerDst(cmd, dst_snapshot->texture, dst_sampler); frame_info.dst_y_coord_scale = dst_snapshot->texture->GetYCoordScale(); blend_info.dst_input_alpha = absorb_opacity ? dst_snapshot->opacity : 1.0; @@ -132,8 +137,13 @@ static std::optional AdvancedBlend( // binding. FS::BindTextureSamplerSrc(cmd, dst_snapshot->texture, dst_sampler); } else { + auto src_sampler_descriptor = src_snapshot->sampler_descriptor; + if (renderer.GetDeviceCapabilities().SupportsDecalTileMode()) { + src_sampler_descriptor.width_address_mode = SamplerAddressMode::kDecal; + src_sampler_descriptor.height_address_mode = SamplerAddressMode::kDecal; + } auto src_sampler = renderer.GetContext()->GetSamplerLibrary()->GetSampler( - src_snapshot->sampler_descriptor); + src_sampler_descriptor); blend_info.color_factor = 0; FS::BindTextureSamplerSrc(cmd, src_snapshot->texture, src_sampler); frame_info.src_y_coord_scale = src_snapshot->texture->GetYCoordScale(); @@ -220,9 +230,10 @@ static std::optional PipelineBlend( frame_info.mvp = Matrix::MakeOrthographic(pass.GetRenderTargetSize()) * Matrix::MakeTranslation(-coverage.origin) * input->transform; - FS::FragInfo frag_info; - frag_info.texture_sampler_y_coord_scale = + frame_info.texture_sampler_y_coord_scale = input->texture->GetYCoordScale(); + + FS::FragInfo frag_info; frag_info.input_alpha = absorb_opacity ? input->opacity : 1.0; FS::BindFragInfo(cmd, host_buffer.EmplaceUniform(frag_info)); VS::BindFrameInfo(cmd, host_buffer.EmplaceUniform(frame_info)); @@ -257,10 +268,8 @@ static std::optional PipelineBlend( if (foreground_color.has_value()) { auto contents = std::make_shared(); - contents->SetGeometry(Geometry::MakeFillPath( - PathBuilder{} - .AddRect(Rect::MakeSize(pass.GetRenderTargetSize())) - .TakePath())); + contents->SetGeometry( + Geometry::MakeRect(Rect::MakeSize(pass.GetRenderTargetSize()))); contents->SetColor(foreground_color.value()); Entity foreground_entity; diff --git a/impeller/entity/contents/framebuffer_blend_contents.cc b/impeller/entity/contents/framebuffer_blend_contents.cc index 7b2699ce4f453..05c615681613a 100644 --- a/impeller/entity/contents/framebuffer_blend_contents.cc +++ b/impeller/entity/contents/framebuffer_blend_contents.cc @@ -128,8 +128,15 @@ bool FramebufferBlendContents::Render(const ContentContext& renderer, VS::FrameInfo frame_info; + auto src_sampler_descriptor = src_snapshot->sampler_descriptor; + if (!renderer.GetDeviceCapabilities().SupportsDecalTileMode()) { + // No known devices that support framebuffer fetch but not decal tile mode. + return false; + } + src_sampler_descriptor.width_address_mode = SamplerAddressMode::kDecal; + src_sampler_descriptor.height_address_mode = SamplerAddressMode::kDecal; auto src_sampler = renderer.GetContext()->GetSamplerLibrary()->GetSampler( - src_snapshot->sampler_descriptor); + src_sampler_descriptor); FS::BindTextureSamplerSrc(cmd, src_snapshot->texture, src_sampler); frame_info.mvp = Matrix::MakeOrthographic(pass.GetRenderTargetSize()) * diff --git a/impeller/entity/shaders/blending/advanced_blend.glsl b/impeller/entity/shaders/blending/advanced_blend.glsl index 6c1ce2ef4acdc..916abf8277a96 100644 --- a/impeller/entity/shaders/blending/advanced_blend.glsl +++ b/impeller/entity/shaders/blending/advanced_blend.glsl @@ -22,19 +22,28 @@ in vec2 v_src_texture_coords; out vec4 frag_color; +vec4 Sample(sampler2D texture_sampler, vec2 texture_coords) { +// gles 2.0 is the only backend without native decal support. +#ifdef IMPELLER_TARGET_OPENGLES + return IPSampleDecal(texture_sampler, texture_coords); +#else + return texture(texture_sampler, texture_coords); +#endif +} + void main() { - vec4 dst_sample = IPSampleDecal(texture_sampler_dst, // sampler - v_dst_texture_coords // texture coordinates - ) * + vec4 dst_sample = Sample(texture_sampler_dst, // sampler + v_dst_texture_coords // texture coordinates + ) * blend_info.dst_input_alpha; vec4 dst = IPUnpremultiply(dst_sample); - vec4 src = blend_info.color_factor > 0 - ? blend_info.color - : IPUnpremultiply(IPSampleDecal( - texture_sampler_src, // sampler - v_src_texture_coords // texture coordinates - )); + vec4 src = + blend_info.color_factor > 0 + ? blend_info.color + : IPUnpremultiply(Sample(texture_sampler_src, // sampler + v_src_texture_coords // texture coordinates + )); vec4 blended = vec4(Blend(dst.rgb, src.rgb), 1) * dst.a; diff --git a/impeller/entity/shaders/blending/blend.frag b/impeller/entity/shaders/blending/blend.frag index af401a151d98d..85e1d7a5a096b 100644 --- a/impeller/entity/shaders/blending/blend.frag +++ b/impeller/entity/shaders/blending/blend.frag @@ -8,7 +8,6 @@ uniform sampler2D texture_sampler_src; uniform FragInfo { - float texture_sampler_y_coord_scale; float input_alpha; } frag_info; @@ -18,7 +17,6 @@ in vec2 v_texture_coords; out vec4 frag_color; void main() { - frag_color = IPSample(texture_sampler_src, v_texture_coords, - frag_info.texture_sampler_y_coord_scale) * - frag_info.input_alpha; + frag_color = + texture(texture_sampler_src, v_texture_coords) * frag_info.input_alpha; } diff --git a/impeller/entity/shaders/blending/blend.vert b/impeller/entity/shaders/blending/blend.vert index 3b4a4bd430445..25a03cd442ccf 100644 --- a/impeller/entity/shaders/blending/blend.vert +++ b/impeller/entity/shaders/blending/blend.vert @@ -2,10 +2,12 @@ // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. +#include #include uniform FrameInfo { mat4 mvp; + float texture_sampler_y_coord_scale; } frame_info; @@ -16,5 +18,6 @@ out vec2 v_texture_coords; void main() { gl_Position = frame_info.mvp * vec4(vertices, 0.0, 1.0); - v_texture_coords = texture_coords; + v_texture_coords = + IPRemapCoords(texture_coords, frame_info.texture_sampler_y_coord_scale); } diff --git a/impeller/entity/shaders/blending/ios/framebuffer_blend.glsl b/impeller/entity/shaders/blending/ios/framebuffer_blend.glsl index 06324909a6af5..181e6ca9fd16f 100644 --- a/impeller/entity/shaders/blending/ios/framebuffer_blend.glsl +++ b/impeller/entity/shaders/blending/ios/framebuffer_blend.glsl @@ -34,9 +34,9 @@ void main() { vec4 dst_sample = ReadDestination(); vec4 dst = IPUnpremultiply(dst_sample); vec4 src = - IPUnpremultiply(IPSampleDecal(texture_sampler_src, // sampler - v_src_texture_coords // texture coordinates - )); + IPUnpremultiply(texture(texture_sampler_src, // sampler + v_src_texture_coords // texture coordinates + )); vec4 blended = vec4(Blend(dst.rgb, src.rgb), 1) * dst.a; From 42372d9bc9cce220ae67dcce6e5be85365741987 Mon Sep 17 00:00:00 2001 From: jonahwilliams Date: Fri, 31 Mar 2023 17:46:56 -0700 Subject: [PATCH 2/2] update malioc.json --- impeller/tools/malioc.json | 512 +++++++++++++++++-------------------- 1 file changed, 241 insertions(+), 271 deletions(-) diff --git a/impeller/tools/malioc.json b/impeller/tools/malioc.json index 9f6418deddff2..fe67ad301f581 100644 --- a/impeller/tools/malioc.json +++ b/impeller/tools/malioc.json @@ -124,7 +124,7 @@ "uses_late_zs_update": false, "variants": { "Main": { - "fp16_arithmetic": 62, + "fp16_arithmetic": 59, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ @@ -134,8 +134,8 @@ "longest_path_cycles": [ 0.65625, 0.65625, - 0.53125, - 0.625, + 0.328125, + 0.25, 0.0, 0.5, 0.5 @@ -151,16 +151,16 @@ ], "shortest_path_bound_pipelines": [ "arith_total", - "arith_cvt" + "arith_fma" ], "shortest_path_cycles": [ - 0.359375, 0.328125, - 0.359375, - 0.25, + 0.328125, + 0.265625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ "arith_total", @@ -169,8 +169,8 @@ "total_cycles": [ 0.65625, 0.65625, - 0.578125, - 0.625, + 0.375, + 0.25, 0.0, 0.5, 0.5 @@ -197,18 +197,18 @@ "uses_late_zs_update": false, "variants": { "Main": { - "fp16_arithmetic": 73, + "fp16_arithmetic": 70, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu" + "varying", + "texture" ], "longest_path_cycles": [ - 0.6875, + 0.4375, 0.296875, - 0.637499988079071, - 0.6875, + 0.4375, + 0.3125, 0.0, 0.5, 0.5 @@ -227,24 +227,23 @@ "arith_cvt" ], "shortest_path_cycles": [ - 0.515625, + 0.421875, 0.265625, - 0.515625, - 0.4375, + 0.421875, + 0.25, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_cvt", - "arith_sfu" + "varying", + "texture" ], "total_cycles": [ - 0.6875, + 0.484375, 0.296875, - 0.6875, - 0.6875, + 0.484375, + 0.3125, 0.0, 0.5, 0.5 @@ -253,7 +252,7 @@ "stack_spill_bytes": 0, "thread_occupancy": 100, "uniform_registers_used": 8, - "work_registers_used": 16 + "work_registers_used": 15 } } } @@ -271,18 +270,18 @@ "uses_late_zs_update": false, "variants": { "Main": { - "fp16_arithmetic": 69, + "fp16_arithmetic": 65, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu" + "varying", + "texture" ], "longest_path_cycles": [ - 0.6875, + 0.4375, 0.265625, - 0.637499988079071, - 0.6875, + 0.4375, + 0.3125, 0.0, 0.5, 0.5 @@ -301,24 +300,23 @@ "arith_cvt" ], "shortest_path_cycles": [ - 0.515625, + 0.421875, 0.234375, - 0.515625, - 0.4375, + 0.421875, + 0.25, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_cvt", - "arith_sfu" + "varying", + "texture" ], "total_cycles": [ - 0.6875, + 0.484375, 0.265625, - 0.6875, - 0.6875, + 0.484375, + 0.3125, 0.0, 0.5, 0.5 @@ -327,7 +325,7 @@ "stack_spill_bytes": 0, "thread_occupancy": 100, "uniform_registers_used": 8, - "work_registers_used": 14 + "work_registers_used": 15 } } } @@ -349,16 +347,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, + 0.1875, 0.171875, - 0.390625, - 0.5, + 0.1875, + 0.125, 0.0, 0.5, 0.5 @@ -373,29 +369,27 @@ "texture" ], "shortest_path_bound_pipelines": [ - "arith_total", - "arith_cvt" + "varying", + "texture" ], "shortest_path_cycles": [ - 0.265625, + 0.171875, 0.140625, - 0.265625, - 0.25, + 0.171875, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, + 0.234375, 0.171875, - 0.4375, - 0.5, + 0.234375, + 0.125, 0.0, 0.5, 0.5 @@ -403,7 +397,7 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 6, + "uniform_registers_used": 8, "work_registers_used": 11 } } @@ -426,16 +420,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, 0.203125, - 0.359375, - 0.5, + 0.203125, + 0.15625, + 0.125, 0.0, 0.5, 0.5 @@ -450,30 +442,27 @@ "texture" ], "shortest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", - "varying" + "varying", + "texture" ], "shortest_path_cycles": [ - 0.25, 0.171875, - 0.234375, - 0.25, + 0.171875, + 0.140625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, 0.203125, - 0.40625, - 0.5, + 0.203125, + 0.203125, + 0.125, 0.0, 0.5, 0.5 @@ -481,7 +470,7 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 6, + "uniform_registers_used": 8, "work_registers_used": 11 } } @@ -504,16 +493,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, 0.28125, - 0.359375, - 0.5, + 0.28125, + 0.15625, + 0.125, 0.0, 0.5, 0.5 @@ -530,29 +517,27 @@ "shortest_path_bound_pipelines": [ "arith_total", "arith_fma", - "arith_sfu", - "varying" + "varying", + "texture" ], "shortest_path_cycles": [ 0.25, 0.25, - 0.234375, - 0.25, + 0.140625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, 0.28125, - 0.40625, - 0.5, + 0.28125, + 0.203125, + 0.125, 0.0, 0.5, 0.5 @@ -560,8 +545,8 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 6, - "work_registers_used": 11 + "uniform_registers_used": 8, + "work_registers_used": 12 } } } @@ -583,16 +568,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, 0.46875, - 0.421875, - 0.5, + 0.46875, + 0.21875, + 0.125, 0.0, 0.5, 0.5 @@ -613,23 +596,21 @@ "shortest_path_cycles": [ 0.4375, 0.4375, - 0.296875, - 0.25, + 0.203125, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, 0.46875, 0.46875, - 0.5, + 0.265625, + 0.125, 0.0, 0.5, 0.5 @@ -656,7 +637,7 @@ "uses_late_zs_update": false, "variants": { "Main": { - "fp16_arithmetic": 70, + "fp16_arithmetic": 69, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ @@ -666,8 +647,8 @@ "longest_path_cycles": [ 0.762499988079071, 0.762499988079071, - 0.6875, - 0.6875, + 0.5, + 0.3125, 0.0, 0.5, 0.5 @@ -686,23 +667,23 @@ "arith_cvt" ], "shortest_path_cycles": [ - 0.5, + 0.390625, 0.328125, - 0.5, - 0.25, + 0.390625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ "arith_total", - "arith_cvt" + "arith_fma" ], "total_cycles": [ - 0.78125, 0.762499988079071, - 0.78125, - 0.6875, + 0.762499988079071, + 0.578125, + 0.3125, 0.0, 0.5, 0.5 @@ -733,16 +714,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, + 0.1875, 0.171875, - 0.390625, - 0.5, + 0.1875, + 0.125, 0.0, 0.5, 0.5 @@ -757,29 +736,27 @@ "texture" ], "shortest_path_bound_pipelines": [ - "arith_total", - "arith_cvt" + "varying", + "texture" ], "shortest_path_cycles": [ - 0.265625, + 0.171875, 0.140625, - 0.265625, - 0.25, + 0.171875, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, + 0.234375, 0.171875, - 0.4375, - 0.5, + 0.234375, + 0.125, 0.0, 0.5, 0.5 @@ -787,7 +764,7 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 6, + "uniform_registers_used": 8, "work_registers_used": 11 } } @@ -806,7 +783,7 @@ "uses_late_zs_update": false, "variants": { "Main": { - "fp16_arithmetic": 62, + "fp16_arithmetic": 59, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ @@ -816,8 +793,8 @@ "longest_path_cycles": [ 0.65625, 0.65625, - 0.53125, - 0.625, + 0.328125, + 0.25, 0.0, 0.5, 0.5 @@ -833,16 +810,16 @@ ], "shortest_path_bound_pipelines": [ "arith_total", - "arith_cvt" + "arith_fma" ], "shortest_path_cycles": [ - 0.359375, 0.328125, - 0.359375, - 0.25, + 0.328125, + 0.265625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ "arith_total", @@ -851,8 +828,8 @@ "total_cycles": [ 0.65625, 0.65625, - 0.578125, - 0.625, + 0.375, + 0.25, 0.0, 0.5, 0.5 @@ -883,16 +860,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, 0.203125, - 0.359375, - 0.5, + 0.203125, + 0.15625, + 0.125, 0.0, 0.5, 0.5 @@ -907,30 +882,27 @@ "texture" ], "shortest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", - "varying" + "varying", + "texture" ], "shortest_path_cycles": [ - 0.25, 0.171875, - 0.234375, - 0.25, + 0.171875, + 0.140625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, 0.203125, - 0.40625, - 0.5, + 0.203125, + 0.203125, + 0.125, 0.0, 0.5, 0.5 @@ -938,7 +910,7 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 6, + "uniform_registers_used": 8, "work_registers_used": 11 } } @@ -961,16 +933,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, 0.46875, - 0.421875, - 0.5, + 0.46875, + 0.21875, + 0.125, 0.0, 0.5, 0.5 @@ -991,23 +961,21 @@ "shortest_path_cycles": [ 0.4375, 0.4375, - 0.296875, - 0.25, + 0.203125, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, 0.46875, 0.46875, - 0.5, + 0.265625, + 0.125, 0.0, 0.5, 0.5 @@ -1034,7 +1002,7 @@ "uses_late_zs_update": false, "variants": { "Main": { - "fp16_arithmetic": 70, + "fp16_arithmetic": 69, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ @@ -1044,8 +1012,8 @@ "longest_path_cycles": [ 0.762499988079071, 0.762499988079071, - 0.6875, - 0.6875, + 0.5, + 0.3125, 0.0, 0.5, 0.5 @@ -1064,23 +1032,23 @@ "arith_cvt" ], "shortest_path_cycles": [ - 0.5, + 0.390625, 0.328125, - 0.5, - 0.25, + 0.390625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ "arith_total", - "arith_cvt" + "arith_fma" ], "total_cycles": [ - 0.78125, 0.762499988079071, - 0.78125, - 0.6875, + 0.762499988079071, + 0.578125, + 0.3125, 0.0, 0.5, 0.5 @@ -1111,16 +1079,14 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "longest_path_cycles": [ - 0.5, 0.25, - 0.359375, - 0.5, + 0.25, + 0.15625, + 0.125, 0.0, 0.5, 0.5 @@ -1135,30 +1101,27 @@ "texture" ], "shortest_path_bound_pipelines": [ - "arith_total", - "arith_sfu", - "varying" + "varying", + "texture" ], "shortest_path_cycles": [ - 0.25, 0.21875, - 0.234375, - 0.25, + 0.21875, + 0.140625, + 0.0625, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ - "arith_total", - "arith_sfu", "varying", "texture" ], "total_cycles": [ - 0.5, 0.25, - 0.40625, - 0.5, + 0.25, + 0.203125, + 0.125, 0.0, 0.5, 0.5 @@ -1166,7 +1129,7 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 6, + "uniform_registers_used": 8, "work_registers_used": 11 } } @@ -1195,8 +1158,8 @@ "longest_path_cycles": [ 0.78125, 0.78125, - 0.5625, - 0.6875, + 0.359375, + 0.3125, 0.0, 0.5, 0.5 @@ -1217,11 +1180,11 @@ "shortest_path_cycles": [ 0.75, 0.75, - 0.4375, - 0.4375, + 0.34375, + 0.25, 0.0, 0.25, - 0.0 + 0.25 ], "total_bound_pipelines": [ "arith_total", @@ -1230,8 +1193,8 @@ "total_cycles": [ 0.78125, 0.78125, - 0.609375, - 0.6875, + 0.40625, + 0.3125, 0.0, 0.5, 0.5 @@ -1240,7 +1203,7 @@ "stack_spill_bytes": 0, "thread_occupancy": 100, "uniform_registers_used": 12, - "work_registers_used": 25 + "work_registers_used": 21 } } } @@ -1262,15 +1225,16 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ + "varying", "texture" ], "longest_path_cycles": [ - 0.0625, - 0.046875, - 0.0625, + 0.03125, + 0.03125, 0.0, 0.0, - 0.125, + 0.0, + 0.25, 0.25 ], "pipelines": [ @@ -1283,34 +1247,36 @@ "texture" ], "shortest_path_bound_pipelines": [ + "varying", "texture" ], "shortest_path_cycles": [ - 0.0625, - 0.046875, - 0.0625, + 0.03125, + 0.03125, 0.0, 0.0, - 0.125, + 0.0, + 0.25, 0.25 ], "total_bound_pipelines": [ + "varying", "texture" ], "total_cycles": [ - 0.0625, - 0.046875, - 0.0625, + 0.03125, + 0.03125, 0.0, 0.0, - 0.125, + 0.0, + 0.25, 0.25 ] }, "stack_spill_bytes": 0, "thread_occupancy": 100, "uniform_registers_used": 4, - "work_registers_used": 6 + "work_registers_used": 4 } } } @@ -1370,20 +1336,20 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 18, + "uniform_registers_used": 20, "work_registers_used": 32 }, "Varying": { - "fp16_arithmetic": null, + "fp16_arithmetic": 100, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ "load_store" ], "longest_path_cycles": [ - 0.0, - 0.0, - 0.0, + 0.03125, + 0.015625, + 0.03125, 0.0, 3.0, 0.0 @@ -1400,9 +1366,9 @@ "load_store" ], "shortest_path_cycles": [ - 0.0, - 0.0, - 0.0, + 0.03125, + 0.015625, + 0.03125, 0.0, 3.0, 0.0 @@ -1411,9 +1377,9 @@ "load_store" ], "total_cycles": [ - 0.0, - 0.0, - 0.0, + 0.03125, + 0.015625, + 0.03125, 0.0, 3.0, 0.0 @@ -1421,8 +1387,8 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 14, - "work_registers_used": 6 + "uniform_registers_used": 16, + "work_registers_used": 7 } } } @@ -5522,7 +5488,7 @@ "core": "Mali-G78", "filename": "flutter/impeller/entity/gles/blend.frag.gles", "has_side_effects": false, - "has_uniform_computation": true, + "has_uniform_computation": false, "modifies_coverage": false, "reads_color_buffer": false, "type": "Fragment", @@ -5534,15 +5500,16 @@ "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ + "varying", "texture" ], "longest_path_cycles": [ - 0.09375, - 0.046875, - 0.09375, + 0.03125, + 0.03125, + 0.03125, 0.0, 0.0, - 0.125, + 0.25, 0.25 ], "pipelines": [ @@ -5555,27 +5522,29 @@ "texture" ], "shortest_path_bound_pipelines": [ + "varying", "texture" ], "shortest_path_cycles": [ - 0.0625, - 0.046875, - 0.0625, + 0.03125, + 0.03125, 0.0, 0.0, - 0.125, + 0.0, + 0.25, 0.25 ], "total_bound_pipelines": [ + "varying", "texture" ], "total_cycles": [ - 0.09375, - 0.046875, - 0.09375, + 0.03125, + 0.03125, + 0.03125, 0.0, 0.0, - 0.125, + 0.25, 0.25 ] }, @@ -5621,10 +5590,11 @@ 1.0 ], "total_bound_pipelines": [ - "arithmetic" + "load_store", + "texture" ], "total_cycles": [ - 1.3333333730697632, + 0.6666666865348816, 1.0, 1.0 ] @@ -5640,7 +5610,7 @@ "Mali-G78": { "core": "Mali-G78", "filename": "flutter/impeller/entity/gles/blend.vert.gles", - "has_uniform_computation": false, + "has_uniform_computation": true, "type": "Vertex", "variants": { "Position": { @@ -5691,20 +5661,20 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 14, + "uniform_registers_used": 16, "work_registers_used": 32 }, "Varying": { - "fp16_arithmetic": null, + "fp16_arithmetic": 100, "has_stack_spilling": false, "performance": { "longest_path_bound_pipelines": [ "load_store" ], "longest_path_cycles": [ - 0.0, - 0.0, - 0.0, + 0.03125, + 0.015625, + 0.03125, 0.0, 3.0, 0.0 @@ -5721,9 +5691,9 @@ "load_store" ], "shortest_path_cycles": [ - 0.0, - 0.0, - 0.0, + 0.03125, + 0.015625, + 0.03125, 0.0, 3.0, 0.0 @@ -5732,9 +5702,9 @@ "load_store" ], "total_cycles": [ - 0.0, - 0.0, - 0.0, + 0.03125, + 0.015625, + 0.03125, 0.0, 3.0, 0.0 @@ -5742,8 +5712,8 @@ }, "stack_spill_bytes": 0, "thread_occupancy": 100, - "uniform_registers_used": 8, - "work_registers_used": 6 + "uniform_registers_used": 10, + "work_registers_used": 7 } } }, @@ -5760,7 +5730,7 @@ "load_store" ], "longest_path_cycles": [ - 2.640000104904175, + 2.9700000286102295, 5.0, 0.0 ], @@ -5773,7 +5743,7 @@ "load_store" ], "shortest_path_cycles": [ - 2.640000104904175, + 2.9700000286102295, 5.0, 0.0 ], @@ -5781,7 +5751,7 @@ "load_store" ], "total_cycles": [ - 2.6666667461395264, + 3.0, 5.0, 0.0 ]