1 #include <msp/core/algorithm.h>
2 #include <msp/core/hash.h>
8 #include "framebuffer.h"
9 #include "pipelinestate.h"
10 #include "pipelinestate_backend.h"
14 #include "stenciltest.h"
15 #include "structurebuilder.h"
17 #include "uniformblock.h"
18 #include "vertexsetup.h"
// Default constructor: binds this state object to the device returned by
// Device::get_current() at construction time.
26 VulkanPipelineState::VulkanPipelineState():
27 device(Device::get_current())
// Move constructor; `other` is the state object being moved from.
30 VulkanPipelineState::VulkanPipelineState(VulkanPipelineState &&other):
// Brings the backend objects in line with the state flagged in `changes`:
// refreshes the vertex setup, recomputes the push constant compatibility
// hash, fetches the pipeline handle from the device's pipeline cache and
// obtains descriptor set slots for the sets whose bindings changed.  Flags
// for work that apply() still has to perform are accumulated in `unapplied`.
35 void VulkanPipelineState::update() const
// The frontend members are reached by casting this object to PipelineState.
37 const PipelineState &self = *static_cast<const PipelineState *>(this);
// Viewport, scissor and vertex setup changes are carried over to `unapplied`
// as they are.
39 unapplied |= changes&(PipelineState::VIEWPORT|PipelineState::SCISSOR|PipelineState::VERTEX_SETUP);
41 if(changes&PipelineState::VERTEX_SETUP)
42 self.vertex_setup->refresh();
44 if(changes&PipelineState::SHPROG)
// Hash of the shader stage flags and the push constant size.  apply()
// compares this value against the one of the previously applied state.
46 push_const_compat = hash<32>(self.shprog->stage_flags);
47 push_const_compat = hash_update<32>(push_const_compat, self.shprog->get_push_constants_size());
// A change in any of these flags causes the pipeline handle to be fetched
// from the cache again.
50 constexpr unsigned pipeline_mask = PipelineState::SHPROG|PipelineState::VERTEX_SETUP|PipelineState::FACE_CULL|
51 PipelineState::DEPTH_TEST|PipelineState::STENCIL_TEST|PipelineState::BLEND|PipelineState::PRIMITIVE_TYPE;
52 if(changes&pipeline_mask)
54 handle = device.get_pipeline_cache().get_pipeline(self);
// apply() binds the pipeline when the SHPROG bit is set in `unapplied`.
55 unapplied |= PipelineState::SHPROG;
58 if(changes&(PipelineState::SHPROG|PipelineState::UNIFORMS|PipelineState::TEXTURES))
// Bit mask of descriptor sets needing a new slot.  A shader program change
// marks all of them.
60 unsigned changed_sets = (changes&PipelineState::SHPROG ? ~0U : 0U);
61 for(const PipelineState::BoundUniformBlock &u: self.uniform_blocks)
62 if(u.changed || changed_sets==~0U)
65 u.used = self.shprog->uses_uniform_block_binding(u.binding);
// Bits 20 and up of a binding give the index of its descriptor set.
67 changed_sets |= 1<<(u.binding>>20);
70 for(const PipelineState::BoundTexture &t: self.textures)
71 if(t.changed || changed_sets==~0U)
73 if(t.texture && t.sampler)
74 t.used = self.shprog->uses_texture_binding(t.binding);
75 changed_sets |= 1<<(t.binding>>20);
// A non-negative level addresses a single mip level; presumably this call
// makes sure the per-level views exist -- TODO confirm in the texture backend.
76 if(t.texture && t.level>=0)
77 t.texture->refresh_mip_views();
85 descriptor_set_slots.resize(self.shprog->get_n_descriptor_sets());
// Start from "no set changed" (one past the last index) and lower the value
// to the smallest changed set index.
86 first_changed_desc_set = descriptor_set_slots.size();
87 for(unsigned i=0; i<descriptor_set_slots.size(); ++i)
88 if(changed_sets&(1<<i))
90 descriptor_set_slots[i] = device.get_descriptor_pool().get_descriptor_set_slot(self, i);
91 first_changed_desc_set = min(first_changed_desc_set, i);
// apply() binds descriptor sets when the UNIFORMS bit is set in `unapplied`.
94 unapplied |= PipelineState::UNIFORMS;
// Builds a 64-bit hash from the state read below: the shader program, the
// vertex setup's own hash, the primitive type, face culling, the sample
// count, depth test, stencil test and blend settings, and the attachments of
// the framebuffer's format.
101 uint64_t VulkanPipelineState::compute_hash() const
103 const PipelineState &self = *static_cast<const PipelineState *>(this);
104 const FrameFormat &format = self.framebuffer->get_format();
106 uint64_t result = hash<64>(self.shprog);
107 result = hash_update<64>(result, self.vertex_setup->compute_hash());
108 result = hash_round<64>(result, self.primitive_type);
// Winding and cull mode are hashed only when culling is in effect, which is
// the same condition fill_creation_info() uses to pick a cull mode other
// than VK_CULL_MODE_NONE.
110 if(self.front_face!=NON_MANIFOLD && self.face_cull!=NO_CULL)
112 result = hash_round<64>(result, self.front_face);
113 result = hash_round<64>(result, self.face_cull);
116 result = hash_round<64>(result, format.get_samples());
// Parameters of a disabled depth test, stencil test or blend are not hashed.
118 if(self.depth_test.enabled)
120 result = hash_round<64>(result, self.depth_test.compare);
121 result = hash_update<64>(result, self.depth_test.write);
124 if(self.stencil_test.enabled)
126 result = hash_round<64>(result, self.stencil_test.compare);
127 result = hash_round<64>(result, self.stencil_test.stencil_fail_op);
128 result = hash_round<64>(result, self.stencil_test.depth_fail_op);
129 result = hash_round<64>(result, self.stencil_test.depth_pass_op);
130 result = hash_update<64>(result, self.stencil_test.reference);
133 if(self.blend.enabled)
135 result = hash_round<64>(result, self.blend.equation);
136 result = hash_round<64>(result, self.blend.src_factor);
137 result = hash_round<64>(result, self.blend.dst_factor);
138 result = hash_round<64>(result, self.blend.write_mask);
// Every attachment of the framebuffer format contributes to the hash.
141 for(FrameAttachment a: format)
142 result = hash_update<64>(result, a);
// Fills `buffer` with a VkGraphicsPipelineCreateInfo and the sub-structures
// it points to, describing the current state.  Viewport and scissor are
// declared as dynamic state and are therefore not part of the pipeline.
//
// buffer: storage handed to StructureBuilder for all of the structures.
147 void VulkanPipelineState::fill_creation_info(vector<char> &buffer) const
149 const PipelineState &self = *static_cast<const PipelineState *>(this);
151 const FrameFormat &format = self.framebuffer->get_format();
// Render pass for the framebuffer's format, taken from the pipeline cache.
// NOTE(review): the meaning of the three `false` arguments is not visible
// here -- see get_render_pass().
152 VkRenderPass render_pass = device.get_pipeline_cache().get_render_pass(format, false, false, false);
// Count the attachments which are neither depth nor stencil; each of them
// gets a blend attachment state below.
154 unsigned n_color_attachments = 0;
155 for(FrameAttachment a: format)
157 unsigned attach_pt = get_attach_point(a);
158 if(attach_pt!=get_attach_point(DEPTH_ATTACHMENT) && attach_pt!=get_attach_point(STENCIL_ATTACHMENT))
159 ++n_color_attachments;
// There are ten add() calls below; presumably the second argument is the
// number of structures to be added -- TODO confirm against StructureBuilder.
162 StructureBuilder sb(buffer, 10);
163 VkGraphicsPipelineCreateInfo *const &pipeline_info = sb.add<VkGraphicsPipelineCreateInfo>();
164 VkPipelineInputAssemblyStateCreateInfo *const &input_assembly_info = sb.add<VkPipelineInputAssemblyStateCreateInfo>();
165 VkPipelineViewportStateCreateInfo *const &viewport_info = sb.add<VkPipelineViewportStateCreateInfo>();
166 VkPipelineRasterizationStateCreateInfo *const &raster_info = sb.add<VkPipelineRasterizationStateCreateInfo>();
167 VkPipelineMultisampleStateCreateInfo *const &multisample_info = sb.add<VkPipelineMultisampleStateCreateInfo>();
168 VkPipelineDepthStencilStateCreateInfo *const &depth_stencil_info = sb.add<VkPipelineDepthStencilStateCreateInfo>();
169 VkPipelineColorBlendStateCreateInfo *const &blend_info = sb.add<VkPipelineColorBlendStateCreateInfo>();
170 VkPipelineColorBlendAttachmentState *const &blend_attachments = sb.add<VkPipelineColorBlendAttachmentState>(n_color_attachments);
171 VkPipelineDynamicStateCreateInfo *const &dynamic_info = sb.add<VkPipelineDynamicStateCreateInfo>();
172 VkDynamicState *const &dynamic_states = sb.add<VkDynamicState>(2);
// Input assembly: topology from the primitive type; primitive restart is
// always enabled.
174 input_assembly_info->sType = VK_STRUCTURE_TYPE_PIPELINE_INPUT_ASSEMBLY_STATE_CREATE_INFO;
175 input_assembly_info->topology = static_cast<VkPrimitiveTopology>(get_vulkan_primitive_type(self.primitive_type));
176 input_assembly_info->primitiveRestartEnable = true;
// One viewport and one scissor rectangle.  The pointers are null because
// both are listed as dynamic states further down.
178 viewport_info->sType = VK_STRUCTURE_TYPE_PIPELINE_VIEWPORT_STATE_CREATE_INFO;
179 viewport_info->viewportCount = 1;
180 viewport_info->pViewports = 0;
181 viewport_info->scissorCount = 1;
182 viewport_info->pScissors = 0;
184 raster_info->sType = VK_STRUCTURE_TYPE_PIPELINE_RASTERIZATION_STATE_CREATE_INFO;
185 raster_info->depthClampEnable = VK_FALSE;
186 raster_info->rasterizerDiscardEnable = VK_FALSE;
187 raster_info->polygonMode = VK_POLYGON_MODE_FILL;
// NOTE(review): the winding is swapped here (CLOCKWISE maps to
// VK_FRONT_FACE_COUNTER_CLOCKWISE).  Presumably this compensates for a
// vertically flipped coordinate system -- confirm before touching.
188 raster_info->frontFace = (self.front_face==CLOCKWISE ? VK_FRONT_FACE_COUNTER_CLOCKWISE : VK_FRONT_FACE_CLOCKWISE);
// No culling when it is disabled or when the front face is NON_MANIFOLD.
189 if(self.face_cull==NO_CULL || self.front_face==NON_MANIFOLD)
190 raster_info->cullMode = VK_CULL_MODE_NONE;
192 raster_info->cullMode = (self.face_cull==CULL_FRONT ? VK_CULL_MODE_FRONT_BIT : VK_CULL_MODE_BACK_BIT);
193 raster_info->depthBiasEnable = VK_FALSE;
194 raster_info->depthBiasConstantFactor = 0.0f;
195 raster_info->depthBiasClamp = 0.0f;
196 raster_info->depthBiasSlopeFactor = 0.0f;
197 raster_info->lineWidth = 1.0f;
// Multisampling: only the sample count comes from the framebuffer format;
// sample shading and the alpha-to-coverage/one features are off.
199 multisample_info->sType = VK_STRUCTURE_TYPE_PIPELINE_MULTISAMPLE_STATE_CREATE_INFO;
200 multisample_info->rasterizationSamples = static_cast<VkSampleCountFlagBits>(get_vulkan_samples(format.get_samples()));
201 multisample_info->sampleShadingEnable = VK_FALSE;
202 multisample_info->minSampleShading = 1.0f;
203 multisample_info->pSampleMask = 0;
204 multisample_info->alphaToCoverageEnable = VK_FALSE;
205 multisample_info->alphaToOneEnable = VK_FALSE;
207 depth_stencil_info->sType = VK_STRUCTURE_TYPE_PIPELINE_DEPTH_STENCIL_STATE_CREATE_INFO;
208 depth_stencil_info->depthTestEnable = self.depth_test.enabled;
209 depth_stencil_info->depthWriteEnable = self.depth_test.write;
210 depth_stencil_info->depthCompareOp = static_cast<VkCompareOp>(get_vulkan_predicate(self.depth_test.compare));
211 depth_stencil_info->depthBoundsTestEnable = VK_FALSE;
// Stencil state is filled in for front faces with all mask bits set, then
// copied to back faces so that both sides behave the same.
213 depth_stencil_info->stencilTestEnable = self.stencil_test.enabled;
214 depth_stencil_info->front.failOp = static_cast<VkStencilOp>(get_vulkan_stencil_op(self.stencil_test.stencil_fail_op));
215 depth_stencil_info->front.passOp = static_cast<VkStencilOp>(get_vulkan_stencil_op(self.stencil_test.depth_pass_op));
216 depth_stencil_info->front.depthFailOp = static_cast<VkStencilOp>(get_vulkan_stencil_op(self.stencil_test.depth_fail_op));
217 depth_stencil_info->front.compareOp = static_cast<VkCompareOp>(get_vulkan_predicate(self.stencil_test.compare));
218 depth_stencil_info->front.compareMask = 0xFFFFFFFFU;
219 depth_stencil_info->front.writeMask = 0xFFFFFFFFU;
220 depth_stencil_info->front.reference = self.stencil_test.reference;
221 depth_stencil_info->back = depth_stencil_info->front;
// All colour attachments share the same blend settings; the alpha channel
// reuses the colour factors and equation.
223 for(unsigned i=0; i<n_color_attachments; ++i)
225 blend_attachments[i].blendEnable = self.blend.enabled;
226 blend_attachments[i].srcColorBlendFactor = static_cast<VkBlendFactor>(get_vulkan_blend_factor(self.blend.src_factor));
227 blend_attachments[i].dstColorBlendFactor = static_cast<VkBlendFactor>(get_vulkan_blend_factor(self.blend.dst_factor));
228 blend_attachments[i].colorBlendOp = static_cast<VkBlendOp>(get_vulkan_blend_equation(self.blend.equation));
229 blend_attachments[i].srcAlphaBlendFactor = blend_attachments[i].srcColorBlendFactor;
230 blend_attachments[i].dstAlphaBlendFactor = blend_attachments[i].dstColorBlendFactor;
231 blend_attachments[i].alphaBlendOp = blend_attachments[i].colorBlendOp;
232 blend_attachments[i].colorWriteMask = get_vulkan_color_mask(self.blend.write_mask);
235 blend_info->sType = VK_STRUCTURE_TYPE_PIPELINE_COLOR_BLEND_STATE_CREATE_INFO;
236 blend_info->attachmentCount = n_color_attachments;
237 blend_info->pAttachments = blend_attachments;
// Viewport and scissor are set with commands at apply() time.
239 dynamic_states[0] = VK_DYNAMIC_STATE_VIEWPORT;
240 dynamic_states[1] = VK_DYNAMIC_STATE_SCISSOR;
242 dynamic_info->sType = VK_STRUCTURE_TYPE_PIPELINE_DYNAMIC_STATE_CREATE_INFO;
243 dynamic_info->dynamicStateCount = 2;
244 dynamic_info->pDynamicStates = dynamic_states;
// Tie the sub-structures together in the top-level creation info.
246 pipeline_info->sType = VK_STRUCTURE_TYPE_GRAPHICS_PIPELINE_CREATE_INFO;
248 pipeline_info->pInputAssemblyState = input_assembly_info;
249 pipeline_info->pTessellationState = 0;
250 pipeline_info->pViewportState = viewport_info;
251 pipeline_info->pRasterizationState = raster_info;
252 pipeline_info->pMultisampleState = multisample_info;
253 pipeline_info->pDepthStencilState = depth_stencil_info;
254 pipeline_info->pColorBlendState = blend_info;
255 pipeline_info->pDynamicState = dynamic_info;
256 pipeline_info->renderPass = handle_cast<::VkRenderPass>(render_pass);
257 pipeline_info->subpass = 0;
// Shader stages and the pipeline layout come from the shader program, which
// stores its stage creation structures as raw bytes.
261 pipeline_info->stageCount = self.shprog->n_stages;
262 pipeline_info->pStages = reinterpret_cast<const VkPipelineShaderStageCreateInfo *>(self.shprog->creation_info.data());
263 pipeline_info->layout = handle_cast<::VkPipelineLayout>(self.shprog->layout_handle);
// Vertex input state is taken from the vertex setup, if there is one.
266 if(self.vertex_setup)
267 pipeline_info->pVertexInputState = reinterpret_cast<const VkPipelineVertexInputStateCreateInfo *>(self.vertex_setup->creation_info.data());
// Builds a 64-bit hash of the resources bound in descriptor set `index`:
// uniform block bindings with their block and buffer, texture bindings with
// their texture, sampler and level, and the shader program's stage flags.
//
// index: descriptor set index, matched against bits 20 and up of each binding.
270 uint64_t VulkanPipelineState::compute_descriptor_set_hash(unsigned index) const
272 const PipelineState &self = *static_cast<const PipelineState *>(this);
274 uint64_t result = hash<64>(0, 0);
// Visit the run of uniform blocks belonging to this set.  Presumably the
// list is kept sorted by binding, as the lower-bound search suggests.
277 auto i = lower_bound_member(self.uniform_blocks, static_cast<int>(index)<<20, &PipelineState::BoundUniformBlock::binding);
278 for(; (i!=self.uniform_blocks.end() && static_cast<unsigned>(i->binding)>>20==index); ++i)
281 result = hash_update<64>(result, i->binding);
282 result = hash_update<64>(result, reinterpret_cast<uintptr_t>(i->block));
283 result = hash_update<64>(result, reinterpret_cast<uintptr_t>(i->buffer->handle));
// Same for the textures of this set.
287 auto j = lower_bound_member(self.textures, index<<20, &PipelineState::BoundTexture::binding);
288 for(; (j!=self.textures.end() && j->binding>>20==index); ++j)
291 result = hash_update<64>(result, j->binding);
292 result = hash_update<64>(result, reinterpret_cast<uintptr_t>(j->texture->handle));
293 result = hash_update<64>(result, reinterpret_cast<uintptr_t>(j->sampler->handle));
294 result = hash_update<64>(result, j->level);
299 result = hash_update<64>(result, self.shprog->stage_flags);
// Looks through the uniform blocks of descriptor set `index` for one that is
// used and whose buffer has STREAMING usage.
//
// index: descriptor set index, matched against bits 20 and up of each binding.
304 bool VulkanPipelineState::is_descriptor_set_dynamic(unsigned index) const
306 const PipelineState &self = *static_cast<const PipelineState *>(this);
308 auto i = lower_bound_member(self.uniform_blocks, static_cast<int>(index)<<20, &PipelineState::BoundUniformBlock::binding);
309 for(; (i!=self.uniform_blocks.end() && static_cast<unsigned>(i->binding)>>20==index); ++i)
310 if(i->used && i->buffer && i->buffer->get_usage()==STREAMING)
// Returns the shader program's descriptor set layout handle for set `index`.
// No check of `index` against the number of layouts is made here.
316 VkDescriptorSetLayout VulkanPipelineState::get_descriptor_set_layout(unsigned index) const
318 return static_cast<const PipelineState *>(this)->shprog->desc_set_layout_handles[index];
// Fills `buffer` with an array of VkWriteDescriptorSet structures, along with
// the buffer and image info structures they point to, for the uniform blocks
// and textures of descriptor set `index`.
//
// index:  descriptor set index, matched against bits 20 and up of each binding.
// frame:  frame number, used to offset into buffers with STREAMING usage.
// buffer: storage handed to StructureBuilder for the structures.
321 unsigned VulkanPipelineState::fill_descriptor_writes(unsigned index, unsigned frame, vector<char> &buffer) const
323 const PipelineState &self = *static_cast<const PipelineState *>(this);
// First uniform block and first texture belonging to this set.
325 auto u_begin = lower_bound_member(self.uniform_blocks, static_cast<int>(index)<<20, &PipelineState::BoundUniformBlock::binding);
326 auto t_begin = lower_bound_member(self.textures, index<<20, &PipelineState::BoundTexture::binding);
// A first pass over both lists determines how many structures are needed.
328 unsigned n_buffers = 0;
329 for(auto i=u_begin; (i!=self.uniform_blocks.end() && static_cast<unsigned>(i->binding)>>20==index); ++i)
332 unsigned n_images = 0;
333 for(auto i=t_begin; (i!=self.textures.end() && i->binding>>20==index); ++i)
336 unsigned n_writes = n_buffers+n_images;
// Three arrays are stored: the writes, the buffer infos and the image infos.
338 StructureBuilder sb(buffer, 3);
339 VkWriteDescriptorSet *const &writes = sb.add<VkWriteDescriptorSet>(n_writes);
340 VkDescriptorBufferInfo *const &buffers = sb.add<VkDescriptorBufferInfo>(n_buffers);
341 VkDescriptorImageInfo *const &images = sb.add<VkDescriptorImageInfo>(n_images);
// Cursors into the three arrays.
343 VkWriteDescriptorSet *write_ptr = writes;
344 VkDescriptorBufferInfo *buffer_ptr = buffers;
345 VkDescriptorImageInfo *image_ptr = images;
// Second pass: one uniform buffer descriptor write per uniform block.
347 for(auto i=u_begin; (i!=self.uniform_blocks.end() && static_cast<unsigned>(i->binding)>>20==index); ++i)
350 buffer_ptr->buffer = handle_cast<::VkBuffer>(i->buffer->handle);
351 buffer_ptr->offset = i->block->get_offset();
// For STREAMING buffers the offset is advanced by `frame` times the buffer
// size; presumably the underlying storage holds one copy per frame -- TODO
// confirm in the buffer backend.
352 if(i->buffer->get_usage()==STREAMING)
353 buffer_ptr->offset += frame*i->buffer->get_size();
354 buffer_ptr->range = i->block->get_data_size();
356 write_ptr->sType = VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET;
// The low 20 bits of a binding are the binding number within the set.
357 write_ptr->dstBinding = i->binding&0xFFFFF;
358 write_ptr->descriptorCount = 1;
359 write_ptr->descriptorType = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER;
360 write_ptr->pBufferInfo = buffer_ptr;
// One combined image sampler descriptor write per texture.
366 for(auto i=t_begin; (i!=self.textures.end() && i->binding>>20==index); ++i)
369 image_ptr->sampler = handle_cast<::VkSampler>(i->sampler->handle);
// The image view is either the texture's main view or the view of the mip
// level given by the binding's `level`.
371 image_ptr->imageView = handle_cast<::VkImageView>(i->texture->view_handle);
373 image_ptr->imageView = handle_cast<::VkImageView>(i->texture->mip_view_handles[i->level]);
374 image_ptr->imageLayout = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
376 write_ptr->sType = VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET;
377 write_ptr->dstBinding = i->binding&0xFFFFF;
378 write_ptr->descriptorCount = 1;
379 write_ptr->descriptorType = VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER;
380 write_ptr->pImageInfo = image_ptr;
// Records the commands needed to make this state current: pipeline binding,
// vertex and index buffer binding, push constants, descriptor set binding
// and the dynamic viewport and scissor.  Which of these are recorded is
// governed by the flags in `unapplied`, extended here with the differences
// found against the previously applied state.
//
// vkCmd:             recorder the commands are issued through.
// last:              previously applied state, compared against this one.
// frame:             frame number passed on when obtaining descriptor sets.
// negative_viewport: when set, the viewport is given a negative height.
389 void VulkanPipelineState::apply(const VulkanCommandRecorder &vkCmd, const VulkanPipelineState *last, unsigned frame, bool negative_viewport) const
391 const PipelineState &self = *static_cast<const PipelineState *>(this);
// Index 0 as the first changed set causes every descriptor set to be bound.
396 first_changed_desc_set = 0;
// Compare against the previously applied state to find out what differs.
400 const PipelineState &last_ps = *static_cast<const PipelineState *>(last);
401 if(handle!=last->handle)
403 unapplied |= PipelineState::SHPROG;
// A different push constant compatibility hash requests binding of all
// descriptor sets, starting from set 0.
404 if(self.push_const_compat!=last_ps.push_const_compat)
406 unapplied |= PipelineState::UNIFORMS;
407 first_changed_desc_set = 0;
410 if(self.vertex_setup!=last_ps.vertex_setup)
411 unapplied |= PipelineState::VERTEX_SETUP;
// A set counts as changed if the previous state had no slot at that index
// or had a different one.
412 for(unsigned i=0; i<descriptor_set_slots.size(); ++i)
413 if(i>=last->descriptor_set_slots.size() || descriptor_set_slots[i]!=last->descriptor_set_slots[i])
415 unapplied |= PipelineState::UNIFORMS;
416 first_changed_desc_set = min(first_changed_desc_set, i);
419 if(self.viewport!=last_ps.viewport)
420 unapplied |= PipelineState::VIEWPORT;
421 if(self.scissor!=last_ps.scissor)
422 unapplied |= PipelineState::SCISSOR;
425 if(unapplied&PipelineState::SHPROG)
426 vkCmd.BindPipeline(VK_PIPELINE_BIND_POINT_GRAPHICS, handle);
// Vertex buffers and the index buffer are bound together from the vertex
// setup, if there is one.
428 if(unapplied&PipelineState::VERTEX_SETUP)
429 if(const VertexSetup *vs = self.vertex_setup)
431 vkCmd.BindVertexBuffers(0, vs->n_bindings, vs->buffers, vs->offsets);
432 VkIndexType index_type = static_cast<VkIndexType>(get_vulkan_index_type(vs->get_index_type()));
433 vkCmd.BindIndexBuffer(vs->get_index_buffer()->handle, 0, index_type);
// Only the first uniform block is checked for the push constant binding.
// When it is used, its data is pushed directly.
436 if(!self.uniform_blocks.empty())
438 const PipelineState::BoundUniformBlock &first_block = self.uniform_blocks.front();
439 if(first_block.used && first_block.binding==ReflectData::PUSH_CONSTANT)
441 const UniformBlock &pc_block = *first_block.block;
442 vkCmd.PushConstants(self.shprog->layout_handle, self.shprog->stage_flags,
443 pc_block.get_offset(), pc_block.get_data_size(), pc_block.get_data_pointer());
// Bind descriptor sets from the first changed one up to the last.
447 if((unapplied&PipelineState::UNIFORMS) && !descriptor_set_slots.empty())
449 vector<VkDescriptorSet> descriptor_set_handles;
450 descriptor_set_handles.reserve(descriptor_set_slots.size()-first_changed_desc_set);
451 for(unsigned i=first_changed_desc_set; i<descriptor_set_slots.size(); ++i)
452 descriptor_set_handles.push_back(device.get_descriptor_pool().get_descriptor_set(
453 self.descriptor_set_slots[i], self, i, frame));
455 vkCmd.BindDescriptorSets(VK_PIPELINE_BIND_POINT_GRAPHICS, self.shprog->layout_handle,
456 first_changed_desc_set, descriptor_set_handles.size(), descriptor_set_handles.data(), 0, 0);
459 if(unapplied&(PipelineState::VIEWPORT|PipelineState::SCISSOR))
// Viewport and scissor are both clipped to the framebuffer's rectangle.
461 Rect fb_rect = self.framebuffer->get_rect();
463 if(unapplied&PipelineState::VIEWPORT)
465 Rect viewport_rect = fb_rect.intersect(self.viewport);
466 VkViewport viewport = { };
467 viewport.x = viewport_rect.left;
468 viewport.y = viewport_rect.bottom;
469 viewport.width = viewport_rect.width;
470 viewport.height = viewport_rect.height;
// For a negative viewport the origin moves to the opposite edge and the
// height is negated, so the same area is covered with the Y axis reversed.
471 if(negative_viewport)
473 viewport.y += viewport.height;
474 viewport.height = -viewport.height;
476 viewport.minDepth = 0.0f;
477 viewport.maxDepth = 1.0f;
478 vkCmd.SetViewport(0, 1, &viewport);
481 if(unapplied&PipelineState::SCISSOR)
483 Rect scissor_rect = fb_rect.intersect(self.scissor);
484 VkRect2D scissor = { };
485 scissor.offset.x = scissor_rect.left;
486 scissor.offset.y = scissor_rect.bottom;
487 scissor.extent.width = scissor_rect.width;
488 scissor.extent.height = scissor_rect.height;
489 vkCmd.SetScissor(0, 1, &scissor);
// Back to "no set changed": one past the last descriptor set index.
494 first_changed_desc_set = descriptor_set_slots.size();