mesa/src/gallium/frontends/lavapipe/lvp_private.h

667 lines
20 KiB
C

/*
* Copyright © 2019 Red Hat.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
* IN THE SOFTWARE.
*/
#pragma once
#include <stdlib.h>
#include <stdio.h>
#include <stdbool.h>
#include <string.h>
#include <assert.h>
#include <stdint.h>
#include "util/macros.h"
#include "util/list.h"
#include "util/u_dynarray.h"
#include "util/simple_mtx.h"
#include "util/u_queue.h"
#include "util/u_upload_mgr.h"
#include "compiler/shader_enums.h"
#include "pipe/p_screen.h"
#include "pipe/p_state.h"
#include "cso_cache/cso_context.h"
#include "nir.h"
/* Pre-declarations needed for WSI entrypoints */
struct wl_surface;
struct wl_display;
typedef struct xcb_connection_t xcb_connection_t;
typedef uint32_t xcb_visualid_t;
typedef uint32_t xcb_window_t;
#define VK_PROTOTYPES
#include <vulkan/vulkan.h>
#include <vulkan/vk_icd.h>
#include "lvp_entrypoints.h"
#include "vk_device.h"
#include "vk_instance.h"
#include "vk_image.h"
#include "vk_log.h"
#include "vk_physical_device.h"
#include "vk_shader_module.h"
#include "vk_util.h"
#include "vk_format.h"
#include "vk_cmd_queue.h"
#include "vk_command_buffer.h"
#include "vk_command_pool.h"
#include "vk_queue.h"
#include "wsi_common.h"
#include <assert.h>
#ifdef __cplusplus
extern "C" {
#endif
#define MAX_SETS 8
#define MAX_PUSH_CONSTANTS_SIZE 128
#define MAX_PUSH_DESCRIPTORS 32
#define MAX_DESCRIPTOR_UNIFORM_BLOCK_SIZE 4096
#define MAX_PER_STAGE_DESCRIPTOR_UNIFORM_BLOCKS 8
#ifdef _WIN32
#define lvp_printflike(a, b)
#else
#define lvp_printflike(a, b) __attribute__((__format__(__printf__, a, b)))
#endif
int lvp_get_instance_entrypoint_index(const char *name);
int lvp_get_device_entrypoint_index(const char *name);
int lvp_get_physical_device_entrypoint_index(const char *name);
const char *lvp_get_instance_entry_name(int index);
const char *lvp_get_physical_device_entry_name(int index);
const char *lvp_get_device_entry_name(int index);
bool lvp_instance_entrypoint_is_enabled(int index, uint32_t core_version,
const struct vk_instance_extension_table *instance);
bool lvp_physical_device_entrypoint_is_enabled(int index, uint32_t core_version,
const struct vk_instance_extension_table *instance);
bool lvp_device_entrypoint_is_enabled(int index, uint32_t core_version,
const struct vk_instance_extension_table *instance,
const struct vk_device_extension_table *device);
#define LVP_DEBUG_ALL_ENTRYPOINTS (1 << 0)
void __lvp_finishme(const char *file, int line, const char *format, ...)
lvp_printflike(3, 4);
#define lvp_finishme(format, ...) \
__lvp_finishme(__FILE__, __LINE__, format, ##__VA_ARGS__);
#define stub_return(v) \
do { \
lvp_finishme("stub %s", __func__); \
return (v); \
} while (0)
#define stub() \
do { \
lvp_finishme("stub %s", __func__); \
return; \
} while (0)
#define LVP_STAGE_MASK ((1 << MESA_SHADER_STAGES) - 1)
#define lvp_foreach_stage(stage, stage_bits) \
for (gl_shader_stage stage, \
__tmp = (gl_shader_stage)((stage_bits) & LVP_STAGE_MASK); \
stage = ffs(__tmp) - 1, __tmp; \
__tmp &= ~(1 << (stage)))
struct lvp_physical_device {
struct vk_physical_device vk;
struct pipe_loader_device *pld;
struct pipe_screen *pscreen;
uint32_t max_images;
VkPhysicalDeviceLimits device_limits;
struct wsi_device wsi_device;
};
struct lvp_instance {
struct vk_instance vk;
uint32_t apiVersion;
int physicalDeviceCount;
struct lvp_physical_device physicalDevice;
uint64_t debug_flags;
struct pipe_loader_device *devs;
int num_devices;
};
VkResult lvp_init_wsi(struct lvp_physical_device *physical_device);
void lvp_finish_wsi(struct lvp_physical_device *physical_device);
bool lvp_physical_device_extension_supported(struct lvp_physical_device *dev,
const char *name);
struct lvp_queue {
struct vk_queue vk;
struct lvp_device * device;
struct pipe_context *ctx;
struct cso_context *cso;
struct u_upload_mgr *uploader;
bool shutdown;
uint64_t timeline;
struct util_queue queue;
simple_mtx_t last_lock;
uint64_t last_finished;
uint64_t last_fence_timeline;
struct pipe_fence_handle *last_fence;
volatile int count;
void *state;
};
struct lvp_semaphore_wait {
struct lvp_semaphore *sema;
uint64_t wait;
};
struct lvp_queue_work {
struct list_head list;
uint32_t cmd_buffer_count;
uint32_t timeline_count;
uint32_t wait_count;
uint32_t signal_count;
uint64_t timeline;
struct lvp_fence *fence;
struct lvp_cmd_buffer **cmd_buffers;
struct lvp_semaphore_timeline **timelines;
struct lvp_semaphore **signals;
VkSemaphore *waits;
uint64_t *wait_vals;
};
struct lvp_pipeline_cache {
struct vk_object_base base;
struct lvp_device * device;
VkAllocationCallbacks alloc;
};
struct lvp_device {
struct vk_device vk;
struct lvp_queue queue;
struct lvp_instance * instance;
struct lvp_physical_device *physical_device;
struct pipe_screen *pscreen;
};
void lvp_device_get_cache_uuid(void *uuid);
enum lvp_device_memory_type {
LVP_DEVICE_MEMORY_TYPE_DEFAULT,
LVP_DEVICE_MEMORY_TYPE_USER_PTR,
LVP_DEVICE_MEMORY_TYPE_OPAQUE_FD,
};
struct lvp_device_memory {
struct vk_object_base base;
struct pipe_memory_allocation *pmem;
uint32_t type_index;
VkDeviceSize map_size;
void * map;
enum lvp_device_memory_type memory_type;
int backed_fd;
};
struct lvp_image {
struct vk_image vk;
VkDeviceSize size;
uint32_t alignment;
struct pipe_memory_allocation *pmem;
unsigned memory_offset;
struct pipe_resource *bo;
};
struct lvp_image_view {
struct vk_image_view vk;
const struct lvp_image *image; /**< VkImageViewCreateInfo::image */
enum pipe_format pformat;
struct pipe_surface *surface; /* have we created a pipe surface for this? */
};
struct lvp_sampler {
struct vk_object_base base;
VkSamplerCreateInfo create_info;
union pipe_color_union border_color;
VkSamplerReductionMode reduction_mode;
uint32_t state[4];
};
struct lvp_descriptor_set_binding_layout {
uint16_t descriptor_index;
/* Number of array elements in this binding */
VkDescriptorType type;
uint16_t array_size;
bool valid;
int16_t dynamic_index;
struct {
int16_t const_buffer_index;
int16_t shader_buffer_index;
int16_t sampler_index;
int16_t sampler_view_index;
int16_t image_index;
int16_t uniform_block_index;
int16_t uniform_block_offset;
} stage[MESA_SHADER_STAGES];
/* Immutable samplers (or NULL if no immutable samplers) */
struct lvp_sampler **immutable_samplers;
};
struct lvp_descriptor_set_layout {
struct vk_object_base base;
/* Descriptor set layouts can be destroyed at almost any time */
uint32_t ref_cnt;
uint32_t immutable_sampler_count;
/* Number of bindings in this descriptor set */
uint16_t binding_count;
/* Total size of the descriptor set with room for all array entries */
uint16_t size;
/* Shader stages affected by this descriptor set */
uint16_t shader_stages;
struct {
uint16_t const_buffer_count;
uint16_t shader_buffer_count;
uint16_t sampler_count;
uint16_t sampler_view_count;
uint16_t image_count;
uint16_t uniform_block_count;
uint16_t uniform_block_size;
uint16_t uniform_block_sizes[MAX_PER_STAGE_DESCRIPTOR_UNIFORM_BLOCKS]; //zero-indexed
} stage[MESA_SHADER_STAGES];
/* Number of dynamic offsets used by this descriptor set */
uint16_t dynamic_offset_count;
/* Bindings in this descriptor set */
struct lvp_descriptor_set_binding_layout binding[0];
};
void lvp_descriptor_set_layout_destroy(struct lvp_device *device,
struct lvp_descriptor_set_layout *layout);
static inline void
lvp_descriptor_set_layout_ref(struct lvp_descriptor_set_layout *layout)
{
assert(layout && layout->ref_cnt >= 1);
p_atomic_inc(&layout->ref_cnt);
}
static inline void
lvp_descriptor_set_layout_unref(struct lvp_device *device,
struct lvp_descriptor_set_layout *layout)
{
assert(layout && layout->ref_cnt >= 1);
if (p_atomic_dec_zero(&layout->ref_cnt))
lvp_descriptor_set_layout_destroy(device, layout);
}
union lvp_descriptor_info {
struct {
struct lvp_sampler *sampler;
struct lvp_image_view *iview;
VkImageLayout image_layout;
};
struct {
struct lvp_buffer *buffer;
VkDeviceSize offset;
VkDeviceSize range;
};
struct lvp_buffer_view *buffer_view;
uint8_t *uniform;
};
struct lvp_descriptor {
VkDescriptorType type;
union lvp_descriptor_info info;
};
struct lvp_descriptor_set {
struct vk_object_base base;
struct lvp_descriptor_set_layout *layout;
struct list_head link;
struct lvp_descriptor descriptors[0];
};
struct lvp_descriptor_pool {
struct vk_object_base base;
VkDescriptorPoolCreateFlags flags;
uint32_t max_sets;
struct list_head sets;
};
struct lvp_descriptor_update_template {
struct vk_object_base base;
uint32_t entry_count;
uint32_t set;
VkDescriptorUpdateTemplateType type;
VkPipelineBindPoint bind_point;
struct lvp_pipeline_layout *pipeline_layout;
VkDescriptorUpdateTemplateEntry entry[0];
};
VkResult
lvp_descriptor_set_create(struct lvp_device *device,
struct lvp_descriptor_set_layout *layout,
struct lvp_descriptor_set **out_set);
void
lvp_descriptor_set_destroy(struct lvp_device *device,
struct lvp_descriptor_set *set);
struct lvp_pipeline_layout {
struct vk_object_base base;
/* Pipeline layouts can be destroyed at almost any time */
uint32_t ref_cnt;
struct {
struct lvp_descriptor_set_layout *layout;
} set[MAX_SETS];
uint32_t num_sets;
uint32_t push_constant_size;
VkShaderStageFlags push_constant_stages;
struct {
uint16_t uniform_block_size;
uint16_t uniform_block_count;
uint16_t uniform_block_sizes[MAX_PER_STAGE_DESCRIPTOR_UNIFORM_BLOCKS * MAX_SETS];
} stage[MESA_SHADER_STAGES];
};
void lvp_pipeline_layout_destroy(struct lvp_device *device,
struct lvp_pipeline_layout *layout);
static inline void
lvp_pipeline_layout_ref(struct lvp_pipeline_layout *layout)
{
assert(layout && layout->ref_cnt >= 1);
p_atomic_inc(&layout->ref_cnt);
}
static inline void
lvp_pipeline_layout_unref(struct lvp_device *device,
struct lvp_pipeline_layout *layout)
{
assert(layout && layout->ref_cnt >= 1);
if (p_atomic_dec_zero(&layout->ref_cnt))
lvp_pipeline_layout_destroy(device, layout);
}
struct lvp_access_info {
uint32_t images_read;
uint32_t images_written;
uint32_t buffers_written;
};
struct lvp_pipeline {
struct vk_object_base base;
struct lvp_device * device;
struct lvp_pipeline_layout * layout;
struct lvp_access_info access[MESA_SHADER_STAGES];
void *mem_ctx;
bool is_compute_pipeline;
bool force_min_sample;
nir_shader *pipeline_nir[MESA_SHADER_STAGES];
void *shader_cso[PIPE_SHADER_TYPES];
VkGraphicsPipelineCreateInfo graphics_create_info;
VkComputePipelineCreateInfo compute_create_info;
uint32_t line_stipple_factor;
uint16_t line_stipple_pattern;
bool line_stipple_enable;
bool line_smooth;
bool disable_multisample;
bool line_rectangular;
bool gs_output_lines;
bool provoking_vertex_last;
bool negative_one_to_one;
};
struct lvp_event {
struct vk_object_base base;
volatile uint64_t event_storage;
};
struct lvp_fence {
struct vk_object_base base;
uint64_t timeline;
struct util_queue_fence fence;
struct pipe_fence_handle *handle;
bool signalled;
};
struct lvp_semaphore_timeline {
struct lvp_semaphore_timeline *next;
uint64_t signal; //api
uint64_t timeline; //queue
struct pipe_fence_handle *fence;
};
struct lvp_semaphore {
struct vk_object_base base;
bool is_timeline;
uint64_t current;
simple_mtx_t lock;
mtx_t submit_lock;
cnd_t submit;
void *mem;
struct util_dynarray links;
struct lvp_semaphore_timeline *timeline;
struct lvp_semaphore_timeline *latest;
struct pipe_fence_handle *handle;
};
struct lvp_queue_noop {
struct lvp_fence *fence;
struct lvp_semaphore *sema;
};
struct lvp_buffer {
struct vk_object_base base;
VkDeviceSize size;
VkBufferUsageFlags usage;
VkDeviceSize offset;
struct pipe_memory_allocation *pmem;
struct pipe_resource *bo;
uint64_t total_size;
};
struct lvp_buffer_view {
struct vk_object_base base;
VkFormat format;
enum pipe_format pformat;
struct lvp_buffer *buffer;
uint32_t offset;
uint64_t range;
};
struct lvp_query_pool {
struct vk_object_base base;
VkQueryType type;
uint32_t count;
VkQueryPipelineStatisticFlags pipeline_stats;
enum pipe_query_type base_type;
struct pipe_query *queries[0];
};
struct lvp_cmd_pool {
struct vk_command_pool vk;
struct list_head cmd_buffers;
struct list_head free_cmd_buffers;
};
enum lvp_cmd_buffer_status {
LVP_CMD_BUFFER_STATUS_INVALID,
LVP_CMD_BUFFER_STATUS_INITIAL,
LVP_CMD_BUFFER_STATUS_RECORDING,
LVP_CMD_BUFFER_STATUS_EXECUTABLE,
LVP_CMD_BUFFER_STATUS_PENDING,
};
struct lvp_cmd_buffer {
struct vk_command_buffer vk;
struct lvp_device * device;
enum lvp_cmd_buffer_status status;
struct lvp_cmd_pool * pool;
struct list_head pool_link;
uint8_t push_constants[MAX_PUSH_CONSTANTS_SIZE];
};
#define LVP_FROM_HANDLE(__lvp_type, __name, __handle) \
struct __lvp_type *__name = __lvp_type ## _from_handle(__handle)
VK_DEFINE_HANDLE_CASTS(lvp_cmd_buffer, vk.base, VkCommandBuffer,
VK_OBJECT_TYPE_COMMAND_BUFFER)
VK_DEFINE_HANDLE_CASTS(lvp_device, vk.base, VkDevice, VK_OBJECT_TYPE_DEVICE)
VK_DEFINE_HANDLE_CASTS(lvp_instance, vk.base, VkInstance, VK_OBJECT_TYPE_INSTANCE)
VK_DEFINE_HANDLE_CASTS(lvp_physical_device, vk.base, VkPhysicalDevice,
VK_OBJECT_TYPE_PHYSICAL_DEVICE)
VK_DEFINE_HANDLE_CASTS(lvp_queue, vk.base, VkQueue, VK_OBJECT_TYPE_QUEUE)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_cmd_pool, vk.base, VkCommandPool,
VK_OBJECT_TYPE_COMMAND_POOL)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_buffer, base, VkBuffer,
VK_OBJECT_TYPE_BUFFER)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_buffer_view, base, VkBufferView,
VK_OBJECT_TYPE_BUFFER_VIEW)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_descriptor_pool, base, VkDescriptorPool,
VK_OBJECT_TYPE_DESCRIPTOR_POOL)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_descriptor_set, base, VkDescriptorSet,
VK_OBJECT_TYPE_DESCRIPTOR_SET)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_descriptor_set_layout, base, VkDescriptorSetLayout,
VK_OBJECT_TYPE_DESCRIPTOR_SET_LAYOUT)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_descriptor_update_template, base, VkDescriptorUpdateTemplate,
VK_OBJECT_TYPE_DESCRIPTOR_UPDATE_TEMPLATE)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_device_memory, base, VkDeviceMemory,
VK_OBJECT_TYPE_DEVICE_MEMORY)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_event, base, VkEvent, VK_OBJECT_TYPE_EVENT)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_image, vk.base, VkImage, VK_OBJECT_TYPE_IMAGE)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_image_view, vk.base, VkImageView,
VK_OBJECT_TYPE_IMAGE_VIEW);
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_pipeline_cache, base, VkPipelineCache,
VK_OBJECT_TYPE_PIPELINE_CACHE)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_pipeline, base, VkPipeline,
VK_OBJECT_TYPE_PIPELINE)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_pipeline_layout, base, VkPipelineLayout,
VK_OBJECT_TYPE_PIPELINE_LAYOUT)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_query_pool, base, VkQueryPool,
VK_OBJECT_TYPE_QUERY_POOL)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_sampler, base, VkSampler,
VK_OBJECT_TYPE_SAMPLER)
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_fence, base, VkFence, VK_OBJECT_TYPE_FENCE);
VK_DEFINE_NONDISP_HANDLE_CASTS(lvp_semaphore, base, VkSemaphore,
VK_OBJECT_TYPE_SEMAPHORE);
struct lvp_write_descriptor {
uint32_t dst_binding;
uint32_t dst_array_element;
uint32_t descriptor_count;
VkDescriptorType descriptor_type;
};
struct lvp_cmd_push_descriptor_set {
VkPipelineBindPoint bind_point;
struct lvp_pipeline_layout *layout;
uint32_t set;
uint32_t descriptor_write_count;
struct lvp_write_descriptor *descriptors;
union lvp_descriptor_info *infos;
};
void lvp_add_enqueue_cmd_entrypoints(struct vk_device_dispatch_table *disp);
VkResult lvp_execute_cmds(struct lvp_device *device,
struct lvp_queue *queue,
struct lvp_cmd_buffer *cmd_buffer);
size_t
lvp_get_rendering_state_size(void);
struct lvp_image *lvp_swapchain_get_image(VkSwapchainKHR swapchain,
uint32_t index);
static inline enum pipe_format
lvp_vk_format_to_pipe_format(VkFormat format)
{
/* Some formats cause problems with CTS right now.*/
if (format == VK_FORMAT_R4G4B4A4_UNORM_PACK16 ||
format == VK_FORMAT_R5G5B5A1_UNORM_PACK16 ||
format == VK_FORMAT_R8_SRGB ||
format == VK_FORMAT_R8G8_SRGB ||
format == VK_FORMAT_R64G64B64A64_SFLOAT ||
format == VK_FORMAT_R64_SFLOAT ||
format == VK_FORMAT_R64G64_SFLOAT ||
format == VK_FORMAT_R64G64B64_SFLOAT ||
format == VK_FORMAT_A2R10G10B10_SINT_PACK32 ||
format == VK_FORMAT_A2B10G10R10_SINT_PACK32 ||
format == VK_FORMAT_G8B8G8R8_422_UNORM ||
format == VK_FORMAT_B8G8R8G8_422_UNORM ||
format == VK_FORMAT_G8_B8_R8_3PLANE_420_UNORM ||
format == VK_FORMAT_G8_B8R8_2PLANE_420_UNORM ||
format == VK_FORMAT_G8_B8_R8_3PLANE_422_UNORM ||
format == VK_FORMAT_G8_B8R8_2PLANE_422_UNORM ||
format == VK_FORMAT_G8_B8_R8_3PLANE_444_UNORM ||
format == VK_FORMAT_G16_B16_R16_3PLANE_420_UNORM ||
format == VK_FORMAT_G16_B16R16_2PLANE_420_UNORM ||
format == VK_FORMAT_G16_B16_R16_3PLANE_422_UNORM ||
format == VK_FORMAT_G16_B16R16_2PLANE_422_UNORM ||
format == VK_FORMAT_G16_B16_R16_3PLANE_444_UNORM ||
format == VK_FORMAT_D16_UNORM_S8_UINT)
return PIPE_FORMAT_NONE;
return vk_format_to_pipe_format(format);
}
void
queue_thread_noop(void *data, void *gdata, int thread_index);
#ifdef __cplusplus
}
#endif