/* * Copyright © 2014-2017 Broadcom * Copyright (C) 2012 Rob Clark * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice (including the next * paragraph) shall be included in all copies or substantial portions of the * Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS * IN THE SOFTWARE. */ #include #include "common/v3d_device_info.h" #include "common/v3d_limits.h" #include "util/os_misc.h" #include "pipe/p_defines.h" #include "pipe/p_screen.h" #include "pipe/p_state.h" #include "util/u_debug.h" #include "util/u_memory.h" #include "util/format/u_format.h" #include "util/u_hash_table.h" #include "util/u_screen.h" #include "util/u_transfer_helper.h" #include "util/ralloc.h" #include "util/xmlconfig.h" #include #include "v3d_screen.h" #include "v3d_context.h" #include "v3d_resource.h" #include "compiler/v3d_compiler.h" #include "drm-uapi/drm_fourcc.h" static const char * v3d_screen_get_name(struct pipe_screen *pscreen) { struct v3d_screen *screen = v3d_screen(pscreen); if (!screen->name) { screen->name = ralloc_asprintf(screen, "V3D %d.%d", screen->devinfo.ver / 10, screen->devinfo.ver % 10); } return screen->name; } static const char * v3d_screen_get_vendor(struct pipe_screen *pscreen) { return "Broadcom"; } static void v3d_screen_destroy(struct pipe_screen *pscreen) { struct v3d_screen *screen = v3d_screen(pscreen); _mesa_hash_table_destroy(screen->bo_handles, NULL); v3d_bufmgr_destroy(pscreen); slab_destroy_parent(&screen->transfer_pool); if (screen->ro) screen->ro->destroy(screen->ro); if (using_v3d_simulator) v3d_simulator_destroy(screen->sim_file); v3d_compiler_free(screen->compiler); #ifdef ENABLE_SHADER_CACHE if (screen->disk_cache) disk_cache_destroy(screen->disk_cache); #endif u_transfer_helper_destroy(pscreen->transfer_helper); close(screen->fd); ralloc_free(pscreen); } static bool v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature) { struct drm_v3d_get_param p = { .param = feature, }; int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p); if (ret != 0) return false; return p.value; } static int v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param) { struct v3d_screen *screen = v3d_screen(pscreen); switch (param) { /* Supported features (boolean caps). */ case PIPE_CAP_VERTEX_COLOR_UNCLAMPED: case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT: case PIPE_CAP_NPOT_TEXTURES: case PIPE_CAP_BLEND_EQUATION_SEPARATE: case PIPE_CAP_TEXTURE_MULTISAMPLE: case PIPE_CAP_TEXTURE_SWIZZLE: case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR: case PIPE_CAP_START_INSTANCE: case PIPE_CAP_VS_INSTANCEID: case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD: case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES: case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX: case PIPE_CAP_EMULATE_NONFIXED_PRIMITIVE_RESTART: case PIPE_CAP_PRIMITIVE_RESTART: case PIPE_CAP_OCCLUSION_QUERY: case PIPE_CAP_POINT_SPRITE: case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME: case PIPE_CAP_DRAW_INDIRECT: case PIPE_CAP_MULTI_DRAW_INDIRECT: case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION: case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET: case PIPE_CAP_SHADER_CAN_READ_OUTPUTS: case PIPE_CAP_SHADER_PACK_HALF_FLOAT: case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR: case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT: case PIPE_CAP_FS_FACE_IS_INTEGER_SYSVAL: case PIPE_CAP_TGSI_TEXCOORD: case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE: case PIPE_CAP_SAMPLER_VIEW_TARGET: case PIPE_CAP_ANISOTROPIC_FILTER: case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS: case PIPE_CAP_INDEP_BLEND_FUNC: return 1; case PIPE_CAP_POLYGON_OFFSET_CLAMP: return screen->devinfo.ver >= 41; case PIPE_CAP_TEXTURE_QUERY_LOD: return screen->devinfo.ver >= 42; break; case PIPE_CAP_PACKED_UNIFORMS: /* We can't enable this flag, because it results in load_ubo * intrinsics across a 16b boundary, but v3d's TMU general * memory accesses wrap on 16b boundaries. */ return 0; case PIPE_CAP_NIR_IMAGES_AS_DEREF: return 0; case PIPE_CAP_TEXTURE_TRANSFER_MODES: /* XXX perf: we don't want to emit these extra blits for * glReadPixels(), since we still have to do an uncached read * from the GPU of the result after waiting for the TFU blit * to happen. However, disabling this introduces instability * in * dEQP-GLES31.functional.image_load_store.early_fragment_tests.* * and corruption in chromium's rendering. */ return PIPE_TEXTURE_TRANSFER_BLIT; case PIPE_CAP_COMPUTE: return screen->has_csd && screen->devinfo.ver >= 41; case PIPE_CAP_GENERATE_MIPMAP: return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU); case PIPE_CAP_INDEP_BLEND_ENABLE: return screen->devinfo.ver >= 40; case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT: return V3D_NON_COHERENT_ATOM_SIZE; case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS: if (screen->devinfo.ver < 40) return 0; return 4; case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT: if (screen->has_cache_flush) return 4; else return 0; /* Disables shader storage */ case PIPE_CAP_GLSL_FEATURE_LEVEL: return 330; case PIPE_CAP_ESSL_FEATURE_LEVEL: return 310; case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY: return 140; case PIPE_CAP_FS_COORD_ORIGIN_UPPER_LEFT: return 1; case PIPE_CAP_FS_COORD_ORIGIN_LOWER_LEFT: return 0; case PIPE_CAP_FS_COORD_PIXEL_CENTER_INTEGER: if (screen->devinfo.ver >= 40) return 0; else return 1; case PIPE_CAP_FS_COORD_PIXEL_CENTER_HALF_INTEGER: if (screen->devinfo.ver >= 40) return 1; else return 0; case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES: case PIPE_CAP_MIXED_COLORBUFFER_FORMATS: case PIPE_CAP_MIXED_COLOR_DEPTH_BITS: return 1; case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS: return 4; case PIPE_CAP_MAX_VARYINGS: return V3D_MAX_FS_INPUTS / 4; /* Texturing. */ case PIPE_CAP_MAX_TEXTURE_2D_SIZE: if (screen->devinfo.ver < 40) return 2048; else if (screen->nonmsaa_texture_size_limit) return 7680; else return V3D_MAX_IMAGE_DIMENSION; case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS: case PIPE_CAP_MAX_TEXTURE_3D_LEVELS: if (screen->devinfo.ver < 40) return 12; else return V3D_MAX_MIP_LEVELS; case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS: return V3D_MAX_ARRAY_LAYERS; /* Render targets. */ case PIPE_CAP_MAX_RENDER_TARGETS: return 4; case PIPE_CAP_VENDOR_ID: return 0x14E4; case PIPE_CAP_ACCELERATED: return 1; case PIPE_CAP_VIDEO_MEMORY: { uint64_t system_memory; if (!os_get_total_physical_memory(&system_memory)) return 0; return (int)(system_memory >> 20); } case PIPE_CAP_UMA: return 1; case PIPE_CAP_ALPHA_TEST: case PIPE_CAP_FLATSHADE: case PIPE_CAP_TWO_SIDED_COLOR: case PIPE_CAP_VERTEX_COLOR_CLAMPED: case PIPE_CAP_FRAGMENT_COLOR_CLAMPED: case PIPE_CAP_GL_CLAMP: return 0; /* Geometry shaders */ case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS: /* Minimum required by GLES 3.2 */ return 1024; case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES: /* MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS / 4 */ return 256; case PIPE_CAP_MAX_GS_INVOCATIONS: return 32; case PIPE_CAP_SUPPORTED_PRIM_MODES: case PIPE_CAP_SUPPORTED_PRIM_MODES_WITH_RESTART: return screen->prim_types; case PIPE_CAP_TEXTURE_BUFFER_OBJECTS: return true; case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT: return 256; case PIPE_CAP_IMAGE_STORE_FORMATTED: return false; default: return u_pipe_screen_get_param_defaults(pscreen, param); } } static float v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param) { switch (param) { case PIPE_CAPF_MIN_LINE_WIDTH: case PIPE_CAPF_MIN_LINE_WIDTH_AA: case PIPE_CAPF_MIN_POINT_SIZE: case PIPE_CAPF_MIN_POINT_SIZE_AA: return 1; case PIPE_CAPF_POINT_SIZE_GRANULARITY: case PIPE_CAPF_LINE_WIDTH_GRANULARITY: return 0.1; case PIPE_CAPF_MAX_LINE_WIDTH: case PIPE_CAPF_MAX_LINE_WIDTH_AA: return V3D_MAX_LINE_WIDTH; case PIPE_CAPF_MAX_POINT_SIZE: case PIPE_CAPF_MAX_POINT_SIZE_AA: return V3D_MAX_POINT_SIZE; case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY: return 16.0f; case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS: return 16.0f; case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE: case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE: case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY: return 0.0f; default: fprintf(stderr, "unknown paramf %d\n", param); return 0; } } static int v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param) { struct v3d_screen *screen = v3d_screen(pscreen); switch (shader) { case PIPE_SHADER_VERTEX: case PIPE_SHADER_FRAGMENT: break; case PIPE_SHADER_COMPUTE: if (!screen->has_csd) return 0; break; case PIPE_SHADER_GEOMETRY: if (screen->devinfo.ver < 41) return 0; break; default: return 0; } /* this is probably not totally correct.. but it's a start: */ switch (param) { case PIPE_SHADER_CAP_MAX_INSTRUCTIONS: case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS: case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS: case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS: return 16384; case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH: return UINT_MAX; case PIPE_SHADER_CAP_MAX_INPUTS: switch (shader) { case PIPE_SHADER_VERTEX: return V3D_MAX_VS_INPUTS / 4; case PIPE_SHADER_GEOMETRY: return V3D_MAX_GS_INPUTS / 4; case PIPE_SHADER_FRAGMENT: return V3D_MAX_FS_INPUTS / 4; default: return 0; }; case PIPE_SHADER_CAP_MAX_OUTPUTS: if (shader == PIPE_SHADER_FRAGMENT) return 4; else return V3D_MAX_FS_INPUTS / 4; case PIPE_SHADER_CAP_MAX_TEMPS: return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */ case PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE: /* Note: Limited by the offset size in * v3d_unit_data_create(). */ return 16 * 1024 * sizeof(float); case PIPE_SHADER_CAP_MAX_CONST_BUFFERS: return 16; case PIPE_SHADER_CAP_CONT_SUPPORTED: return 0; case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR: /* We don't currently support this in the backend, but that is * okay because our NIR compiler sets the option * lower_all_io_to_temps, which will eliminate indirect * indexing on all input/output variables by translating it to * indirect indexing on temporary variables instead, which we * will then lower to scratch. We prefer this over setting this * to 0, which would cause if-ladder injection to eliminate * indirect indexing on inputs. */ return 1; case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR: return 1; case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR: return 1; case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR: return 1; case PIPE_SHADER_CAP_SUBROUTINES: return 0; case PIPE_SHADER_CAP_INTEGERS: return 1; case PIPE_SHADER_CAP_FP16: case PIPE_SHADER_CAP_FP16_DERIVATIVES: case PIPE_SHADER_CAP_FP16_CONST_BUFFERS: case PIPE_SHADER_CAP_INT16: case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS: case PIPE_SHADER_CAP_DROUND_SUPPORTED: case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED: case PIPE_SHADER_CAP_LDEXP_SUPPORTED: case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE: case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED: case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS: case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS: return 0; case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS: case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS: return V3D_MAX_TEXTURE_SAMPLERS; case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS: if (screen->has_cache_flush) { if (shader == PIPE_SHADER_VERTEX || shader == PIPE_SHADER_GEOMETRY) { return 0; } return PIPE_MAX_SHADER_BUFFERS; } else { return 0; } case PIPE_SHADER_CAP_MAX_SHADER_IMAGES: if (screen->has_cache_flush) { if (screen->devinfo.ver < 41) return 0; else return PIPE_MAX_SHADER_IMAGES; } else { return 0; } case PIPE_SHADER_CAP_PREFERRED_IR: return PIPE_SHADER_IR_NIR; case PIPE_SHADER_CAP_SUPPORTED_IRS: return 1 << PIPE_SHADER_IR_NIR; default: fprintf(stderr, "unknown shader param %d\n", param); return 0; } return 0; } static int v3d_get_compute_param(struct pipe_screen *pscreen, enum pipe_shader_ir ir_type, enum pipe_compute_cap param, void *ret) { struct v3d_screen *screen = v3d_screen(pscreen); if (!screen->has_csd) return 0; #define RET(x) do { \ if (ret) \ memcpy(ret, x, sizeof(x)); \ return sizeof(x); \ } while (0) switch (param) { case PIPE_COMPUTE_CAP_ADDRESS_BITS: RET((uint32_t []) { 32 }); break; case PIPE_COMPUTE_CAP_IR_TARGET: sprintf(ret, "v3d"); return strlen(ret); case PIPE_COMPUTE_CAP_GRID_DIMENSION: RET((uint64_t []) { 3 }); case PIPE_COMPUTE_CAP_MAX_GRID_SIZE: /* GL_MAX_COMPUTE_SHADER_WORK_GROUP_COUNT: The CSD has a * 16-bit field for the number of workgroups in each * dimension. */ RET(((uint64_t []) { 65535, 65535, 65535 })); case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE: /* GL_MAX_COMPUTE_WORK_GROUP_SIZE */ RET(((uint64_t []) { 256, 256, 256 })); case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK: case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK: /* GL_MAX_COMPUTE_WORK_GROUP_INVOCATIONS: This is * limited by WG_SIZE in the CSD. */ RET((uint64_t []) { 256 }); case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE: RET((uint64_t []) { 1024 * 1024 * 1024 }); case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE: /* GL_MAX_COMPUTE_SHARED_MEMORY_SIZE */ RET((uint64_t []) { 32768 }); case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE: case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE: RET((uint64_t []) { 4096 }); case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE: { struct sysinfo si; sysinfo(&si); RET((uint64_t []) { si.totalram }); } case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY: /* OpenCL only */ RET((uint32_t []) { 0 }); case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS: RET((uint32_t []) { 1 }); case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED: RET((uint32_t []) { 1 }); case PIPE_COMPUTE_CAP_SUBGROUP_SIZE: RET((uint32_t []) { 16 }); } return 0; } static bool v3d_screen_is_format_supported(struct pipe_screen *pscreen, enum pipe_format format, enum pipe_texture_target target, unsigned sample_count, unsigned storage_sample_count, unsigned usage) { struct v3d_screen *screen = v3d_screen(pscreen); if (MAX2(1, sample_count) != MAX2(1, storage_sample_count)) return false; if (sample_count > 1 && sample_count != V3D_MAX_SAMPLES) return false; if (target >= PIPE_MAX_TEXTURE_TYPES) { return false; } if (usage & PIPE_BIND_VERTEX_BUFFER) { switch (format) { case PIPE_FORMAT_R32G32B32A32_FLOAT: case PIPE_FORMAT_R32G32B32_FLOAT: case PIPE_FORMAT_R32G32_FLOAT: case PIPE_FORMAT_R32_FLOAT: case PIPE_FORMAT_R32G32B32A32_SNORM: case PIPE_FORMAT_R32G32B32_SNORM: case PIPE_FORMAT_R32G32_SNORM: case PIPE_FORMAT_R32_SNORM: case PIPE_FORMAT_R32G32B32A32_SSCALED: case PIPE_FORMAT_R32G32B32_SSCALED: case PIPE_FORMAT_R32G32_SSCALED: case PIPE_FORMAT_R32_SSCALED: case PIPE_FORMAT_R16G16B16A16_UNORM: case PIPE_FORMAT_R16G16B16_UNORM: case PIPE_FORMAT_R16G16_UNORM: case PIPE_FORMAT_R16_UNORM: case PIPE_FORMAT_R16G16B16A16_SNORM: case PIPE_FORMAT_R16G16B16_SNORM: case PIPE_FORMAT_R16G16_SNORM: case PIPE_FORMAT_R16_SNORM: case PIPE_FORMAT_R16G16B16A16_USCALED: case PIPE_FORMAT_R16G16B16_USCALED: case PIPE_FORMAT_R16G16_USCALED: case PIPE_FORMAT_R16_USCALED: case PIPE_FORMAT_R16G16B16A16_SSCALED: case PIPE_FORMAT_R16G16B16_SSCALED: case PIPE_FORMAT_R16G16_SSCALED: case PIPE_FORMAT_R16_SSCALED: case PIPE_FORMAT_B8G8R8A8_UNORM: case PIPE_FORMAT_R8G8B8A8_UNORM: case PIPE_FORMAT_R8G8B8_UNORM: case PIPE_FORMAT_R8G8_UNORM: case PIPE_FORMAT_R8_UNORM: case PIPE_FORMAT_R8G8B8A8_SNORM: case PIPE_FORMAT_R8G8B8_SNORM: case PIPE_FORMAT_R8G8_SNORM: case PIPE_FORMAT_R8_SNORM: case PIPE_FORMAT_R8G8B8A8_USCALED: case PIPE_FORMAT_R8G8B8_USCALED: case PIPE_FORMAT_R8G8_USCALED: case PIPE_FORMAT_R8_USCALED: case PIPE_FORMAT_R8G8B8A8_SSCALED: case PIPE_FORMAT_R8G8B8_SSCALED: case PIPE_FORMAT_R8G8_SSCALED: case PIPE_FORMAT_R8_SSCALED: case PIPE_FORMAT_R10G10B10A2_UNORM: case PIPE_FORMAT_B10G10R10A2_UNORM: case PIPE_FORMAT_R10G10B10A2_SNORM: case PIPE_FORMAT_B10G10R10A2_SNORM: case PIPE_FORMAT_R10G10B10A2_USCALED: case PIPE_FORMAT_B10G10R10A2_USCALED: case PIPE_FORMAT_R10G10B10A2_SSCALED: case PIPE_FORMAT_B10G10R10A2_SSCALED: break; default: return false; } } /* FORMAT_NONE gets allowed for ARB_framebuffer_no_attachments's probe * of FRAMEBUFFER_MAX_SAMPLES */ if ((usage & PIPE_BIND_RENDER_TARGET) && format != PIPE_FORMAT_NONE && !v3d_rt_format_supported(&screen->devinfo, format)) { return false; } if ((usage & PIPE_BIND_SAMPLER_VIEW) && !v3d_tex_format_supported(&screen->devinfo, format)) { return false; } if ((usage & PIPE_BIND_DEPTH_STENCIL) && !(format == PIPE_FORMAT_S8_UINT_Z24_UNORM || format == PIPE_FORMAT_X8Z24_UNORM || format == PIPE_FORMAT_Z16_UNORM || format == PIPE_FORMAT_Z32_FLOAT || format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) { return false; } if ((usage & PIPE_BIND_INDEX_BUFFER) && !(format == PIPE_FORMAT_R8_UINT || format == PIPE_FORMAT_R16_UINT || format == PIPE_FORMAT_R32_UINT)) { return false; } if (usage & PIPE_BIND_SHADER_IMAGE) { switch (format) { /* FIXME: maybe we can implement a swizzle-on-writes to add * support for BGRA-alike formats. */ case PIPE_FORMAT_A4B4G4R4_UNORM: case PIPE_FORMAT_A1B5G5R5_UNORM: case PIPE_FORMAT_B5G6R5_UNORM: case PIPE_FORMAT_B8G8R8A8_UNORM: case PIPE_FORMAT_X8Z24_UNORM: case PIPE_FORMAT_Z16_UNORM: return false; default: return true; } } return true; } static const nir_shader_compiler_options v3d_nir_options = { .lower_uadd_sat = true, .lower_usub_sat = true, .lower_iadd_sat = true, .lower_all_io_to_temps = true, .lower_extract_byte = true, .lower_extract_word = true, .lower_insert_byte = true, .lower_insert_word = true, .lower_bitfield_insert_to_shifts = true, .lower_bitfield_extract_to_shifts = true, .lower_bitfield_reverse = true, .lower_bit_count = true, .lower_cs_local_id_to_index = true, .lower_ffract = true, .lower_fmod = true, .lower_pack_unorm_2x16 = true, .lower_pack_snorm_2x16 = true, .lower_pack_unorm_4x8 = true, .lower_pack_snorm_4x8 = true, .lower_unpack_unorm_4x8 = true, .lower_unpack_snorm_4x8 = true, .lower_pack_half_2x16 = true, .lower_unpack_half_2x16 = true, .lower_pack_32_2x16 = true, .lower_pack_32_2x16_split = true, .lower_unpack_32_2x16_split = true, .lower_fdiv = true, .lower_find_lsb = true, .lower_ffma16 = true, .lower_ffma32 = true, .lower_ffma64 = true, .lower_flrp32 = true, .lower_fpow = true, .lower_fsat = true, .lower_fsqrt = true, .lower_ifind_msb = true, .lower_isign = true, .lower_ldexp = true, .lower_mul_high = true, .lower_wpos_pntc = true, .lower_rotate = true, .lower_to_scalar = true, .lower_int64_options = nir_lower_imul_2x32_64, .has_fsub = true, .has_isub = true, .divergence_analysis_options = nir_divergence_multiple_workgroup_per_compute_subgroup, /* This will enable loop unrolling in the state tracker so we won't * be able to selectively disable it in backend if it leads to * lower thread counts or TMU spills. Choose a conservative maximum to * limit register pressure impact. */ .max_unroll_iterations = 16, .force_indirect_unrolling_sampler = true, }; static const void * v3d_screen_get_compiler_options(struct pipe_screen *pscreen, enum pipe_shader_ir ir, unsigned shader) { return &v3d_nir_options; } static const uint64_t v3d_available_modifiers[] = { DRM_FORMAT_MOD_BROADCOM_UIF, DRM_FORMAT_MOD_LINEAR, DRM_FORMAT_MOD_BROADCOM_SAND128, }; static void v3d_screen_query_dmabuf_modifiers(struct pipe_screen *pscreen, enum pipe_format format, int max, uint64_t *modifiers, unsigned int *external_only, int *count) { int i; int num_modifiers = ARRAY_SIZE(v3d_available_modifiers); /* Expose DRM_FORMAT_MOD_BROADCOM_SAND128 only for PIPE_FORMAT_NV12 */ if (format != PIPE_FORMAT_NV12) num_modifiers--; if (!modifiers) { *count = num_modifiers; return; } *count = MIN2(max, num_modifiers); for (i = 0; i < *count; i++) { modifiers[i] = v3d_available_modifiers[i]; if (external_only) external_only[i] = util_format_is_yuv(format); } } static bool v3d_screen_is_dmabuf_modifier_supported(struct pipe_screen *pscreen, uint64_t modifier, enum pipe_format format, bool *external_only) { int i; bool is_sand_col128 = (format == PIPE_FORMAT_NV12) && (fourcc_mod_broadcom_mod(modifier) == DRM_FORMAT_MOD_BROADCOM_SAND128); if (is_sand_col128) { if (external_only) *external_only = true; return true; } /* We don't want to generally allow DRM_FORMAT_MOD_BROADCOM_SAND128 * modifier, that is the last v3d_available_modifiers. We only accept * it in the case of having a PIPE_FORMAT_NV12. */ assert(v3d_available_modifiers[ARRAY_SIZE(v3d_available_modifiers) - 1] == DRM_FORMAT_MOD_BROADCOM_SAND128); for (i = 0; i < ARRAY_SIZE(v3d_available_modifiers) - 1; i++) { if (v3d_available_modifiers[i] == modifier) { if (external_only) *external_only = util_format_is_yuv(format); return true; } } return false; } static enum pipe_format v3d_screen_get_compatible_tlb_format(struct pipe_screen *screen, enum pipe_format format) { switch (format) { case PIPE_FORMAT_R16G16_UNORM: return PIPE_FORMAT_R16G16_UINT; default: return format; } } static struct disk_cache * v3d_screen_get_disk_shader_cache(struct pipe_screen *pscreen) { struct v3d_screen *screen = v3d_screen(pscreen); return screen->disk_cache; } struct pipe_screen * v3d_screen_create(int fd, const struct pipe_screen_config *config, struct renderonly *ro) { struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen); struct pipe_screen *pscreen; pscreen = &screen->base; pscreen->destroy = v3d_screen_destroy; pscreen->get_param = v3d_screen_get_param; pscreen->get_paramf = v3d_screen_get_paramf; pscreen->get_shader_param = v3d_screen_get_shader_param; pscreen->get_compute_param = v3d_get_compute_param; pscreen->context_create = v3d_context_create; pscreen->is_format_supported = v3d_screen_is_format_supported; pscreen->get_canonical_format = v3d_screen_get_compatible_tlb_format; screen->fd = fd; screen->ro = ro; list_inithead(&screen->bo_cache.time_list); (void)mtx_init(&screen->bo_handles_mutex, mtx_plain); screen->bo_handles = util_hash_table_create_ptr_keys(); #if defined(USE_V3D_SIMULATOR) screen->sim_file = v3d_simulator_init(screen->fd); #endif if (!v3d_get_device_info(screen->fd, &screen->devinfo, &v3d_ioctl)) goto fail; driParseConfigFiles(config->options, config->options_info, 0, "v3d", NULL, NULL, NULL, 0, NULL, 0); /* We have to driCheckOption for the simulator mode to not assertion * fail on not having our XML config. */ const char *nonmsaa_name = "v3d_nonmsaa_texture_size_limit"; screen->nonmsaa_texture_size_limit = driCheckOption(config->options, nonmsaa_name, DRI_BOOL) && driQueryOptionb(config->options, nonmsaa_name); slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16); screen->has_csd = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CSD); screen->has_cache_flush = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CACHE_FLUSH); screen->has_perfmon = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_PERFMON); v3d_fence_init(screen); v3d_resource_screen_init(pscreen); screen->compiler = v3d_compiler_init(&screen->devinfo, 0); #ifdef ENABLE_SHADER_CACHE v3d_disk_cache_init(screen); #endif pscreen->get_name = v3d_screen_get_name; pscreen->get_vendor = v3d_screen_get_vendor; pscreen->get_device_vendor = v3d_screen_get_vendor; pscreen->get_compiler_options = v3d_screen_get_compiler_options; pscreen->get_disk_shader_cache = v3d_screen_get_disk_shader_cache; pscreen->query_dmabuf_modifiers = v3d_screen_query_dmabuf_modifiers; pscreen->is_dmabuf_modifier_supported = v3d_screen_is_dmabuf_modifier_supported; if (screen->has_perfmon) { pscreen->get_driver_query_group_info = v3d_get_driver_query_group_info; pscreen->get_driver_query_info = v3d_get_driver_query_info; } /* Generate the bitmask of supported draw primitives. */ screen->prim_types = BITFIELD_BIT(PIPE_PRIM_POINTS) | BITFIELD_BIT(PIPE_PRIM_LINES) | BITFIELD_BIT(PIPE_PRIM_LINE_LOOP) | BITFIELD_BIT(PIPE_PRIM_LINE_STRIP) | BITFIELD_BIT(PIPE_PRIM_TRIANGLES) | BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP) | BITFIELD_BIT(PIPE_PRIM_TRIANGLE_FAN) | BITFIELD_BIT(PIPE_PRIM_LINES_ADJACENCY) | BITFIELD_BIT(PIPE_PRIM_LINE_STRIP_ADJACENCY) | BITFIELD_BIT(PIPE_PRIM_TRIANGLES_ADJACENCY) | BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP_ADJACENCY); return pscreen; fail: close(fd); ralloc_free(pscreen); return NULL; }