936 lines
33 KiB
C
936 lines
33 KiB
C
/*
 * Copyright © 2014-2017 Broadcom
 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */
|
|
|
|
#include <sys/sysinfo.h>
|
|
|
|
#include "common/v3d_device_info.h"
|
|
#include "common/v3d_limits.h"
|
|
#include "util/os_misc.h"
|
|
#include "pipe/p_defines.h"
|
|
#include "pipe/p_screen.h"
|
|
#include "pipe/p_state.h"
|
|
|
|
#include "util/u_debug.h"
|
|
#include "util/u_memory.h"
|
|
#include "util/format/u_format.h"
|
|
#include "util/u_hash_table.h"
|
|
#include "util/u_screen.h"
|
|
#include "util/u_transfer_helper.h"
|
|
#include "util/ralloc.h"
|
|
#include "util/xmlconfig.h"
|
|
|
|
#include <xf86drm.h>
|
|
#include "v3d_screen.h"
|
|
#include "v3d_context.h"
|
|
#include "v3d_resource.h"
|
|
#include "compiler/v3d_compiler.h"
|
|
#include "drm-uapi/drm_fourcc.h"
|
|
|
|
static const char *
|
|
v3d_screen_get_name(struct pipe_screen *pscreen)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
if (!screen->name) {
|
|
screen->name = ralloc_asprintf(screen,
|
|
"V3D %d.%d",
|
|
screen->devinfo.ver / 10,
|
|
screen->devinfo.ver % 10);
|
|
}
|
|
|
|
return screen->name;
|
|
}
|
|
|
|
/**
 * Returns the constant vendor string.  The screen argument is not used.
 *
 * v3d_screen_create() installs this function for both the get_vendor and
 * the get_device_vendor hooks.
 */
static const char *
v3d_screen_get_vendor(struct pipe_screen *pscreen)
{
        static const char vendor[] = "Broadcom";

        return vendor;
}
|
|
|
|
static void
|
|
v3d_screen_destroy(struct pipe_screen *pscreen)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
_mesa_hash_table_destroy(screen->bo_handles, NULL);
|
|
v3d_bufmgr_destroy(pscreen);
|
|
slab_destroy_parent(&screen->transfer_pool);
|
|
if (screen->ro)
|
|
screen->ro->destroy(screen->ro);
|
|
|
|
if (using_v3d_simulator)
|
|
v3d_simulator_destroy(screen->sim_file);
|
|
|
|
v3d_compiler_free(screen->compiler);
|
|
|
|
#ifdef ENABLE_SHADER_CACHE
|
|
if (screen->disk_cache)
|
|
disk_cache_destroy(screen->disk_cache);
|
|
#endif
|
|
|
|
u_transfer_helper_destroy(pscreen->transfer_helper);
|
|
|
|
close(screen->fd);
|
|
ralloc_free(pscreen);
|
|
}
|
|
|
|
static bool
|
|
v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature)
|
|
{
|
|
struct drm_v3d_get_param p = {
|
|
.param = feature,
|
|
};
|
|
int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p);
|
|
|
|
if (ret != 0)
|
|
return false;
|
|
|
|
return p.value;
|
|
}
|
|
|
|
static int
|
|
v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
switch (param) {
|
|
/* Supported features (boolean caps). */
|
|
case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
|
|
case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
|
|
case PIPE_CAP_NPOT_TEXTURES:
|
|
case PIPE_CAP_BLEND_EQUATION_SEPARATE:
|
|
case PIPE_CAP_TEXTURE_MULTISAMPLE:
|
|
case PIPE_CAP_TEXTURE_SWIZZLE:
|
|
case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
|
|
case PIPE_CAP_START_INSTANCE:
|
|
case PIPE_CAP_VS_INSTANCEID:
|
|
case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
|
|
case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
|
|
case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
|
|
case PIPE_CAP_EMULATE_NONFIXED_PRIMITIVE_RESTART:
|
|
case PIPE_CAP_PRIMITIVE_RESTART:
|
|
case PIPE_CAP_OCCLUSION_QUERY:
|
|
case PIPE_CAP_POINT_SPRITE:
|
|
case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
|
|
case PIPE_CAP_DRAW_INDIRECT:
|
|
case PIPE_CAP_MULTI_DRAW_INDIRECT:
|
|
case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
|
|
case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
|
|
case PIPE_CAP_SHADER_CAN_READ_OUTPUTS:
|
|
case PIPE_CAP_SHADER_PACK_HALF_FLOAT:
|
|
case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
|
|
case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
|
|
case PIPE_CAP_FS_FACE_IS_INTEGER_SYSVAL:
|
|
case PIPE_CAP_TGSI_TEXCOORD:
|
|
case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
|
|
case PIPE_CAP_SAMPLER_VIEW_TARGET:
|
|
case PIPE_CAP_ANISOTROPIC_FILTER:
|
|
case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
|
|
case PIPE_CAP_INDEP_BLEND_FUNC:
|
|
return 1;
|
|
|
|
case PIPE_CAP_POLYGON_OFFSET_CLAMP:
|
|
return screen->devinfo.ver >= 41;
|
|
|
|
case PIPE_CAP_TEXTURE_QUERY_LOD:
|
|
return screen->devinfo.ver >= 42;
|
|
break;
|
|
|
|
case PIPE_CAP_PACKED_UNIFORMS:
|
|
/* We can't enable this flag, because it results in load_ubo
|
|
* intrinsics across a 16b boundary, but v3d's TMU general
|
|
* memory accesses wrap on 16b boundaries.
|
|
*/
|
|
return 0;
|
|
|
|
case PIPE_CAP_NIR_IMAGES_AS_DEREF:
|
|
return 0;
|
|
|
|
case PIPE_CAP_TEXTURE_TRANSFER_MODES:
|
|
/* XXX perf: we don't want to emit these extra blits for
|
|
* glReadPixels(), since we still have to do an uncached read
|
|
* from the GPU of the result after waiting for the TFU blit
|
|
* to happen. However, disabling this introduces instability
|
|
* in
|
|
* dEQP-GLES31.functional.image_load_store.early_fragment_tests.*
|
|
* and corruption in chromium's rendering.
|
|
*/
|
|
return PIPE_TEXTURE_TRANSFER_BLIT;
|
|
|
|
case PIPE_CAP_COMPUTE:
|
|
return screen->has_csd && screen->devinfo.ver >= 41;
|
|
|
|
case PIPE_CAP_GENERATE_MIPMAP:
|
|
return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU);
|
|
|
|
case PIPE_CAP_INDEP_BLEND_ENABLE:
|
|
return screen->devinfo.ver >= 40;
|
|
|
|
case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
|
|
return V3D_NON_COHERENT_ATOM_SIZE;
|
|
|
|
case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
|
|
if (screen->devinfo.ver < 40)
|
|
return 0;
|
|
return 4;
|
|
|
|
case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
|
|
if (screen->has_cache_flush)
|
|
return 4;
|
|
else
|
|
return 0; /* Disables shader storage */
|
|
|
|
case PIPE_CAP_GLSL_FEATURE_LEVEL:
|
|
return 330;
|
|
|
|
case PIPE_CAP_ESSL_FEATURE_LEVEL:
|
|
return 310;
|
|
|
|
case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
|
|
return 140;
|
|
|
|
case PIPE_CAP_FS_COORD_ORIGIN_UPPER_LEFT:
|
|
return 1;
|
|
case PIPE_CAP_FS_COORD_ORIGIN_LOWER_LEFT:
|
|
return 0;
|
|
case PIPE_CAP_FS_COORD_PIXEL_CENTER_INTEGER:
|
|
if (screen->devinfo.ver >= 40)
|
|
return 0;
|
|
else
|
|
return 1;
|
|
case PIPE_CAP_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
|
|
if (screen->devinfo.ver >= 40)
|
|
return 1;
|
|
else
|
|
return 0;
|
|
|
|
case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
|
|
case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
|
|
case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
|
|
return 1;
|
|
|
|
case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
|
|
return 4;
|
|
|
|
case PIPE_CAP_MAX_VARYINGS:
|
|
return V3D_MAX_FS_INPUTS / 4;
|
|
|
|
/* Texturing. */
|
|
case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
|
|
if (screen->devinfo.ver < 40)
|
|
return 2048;
|
|
else if (screen->nonmsaa_texture_size_limit)
|
|
return 7680;
|
|
else
|
|
return V3D_MAX_IMAGE_DIMENSION;
|
|
case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
|
|
case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
|
|
if (screen->devinfo.ver < 40)
|
|
return 12;
|
|
else
|
|
return V3D_MAX_MIP_LEVELS;
|
|
case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
|
|
return V3D_MAX_ARRAY_LAYERS;
|
|
|
|
/* Render targets. */
|
|
case PIPE_CAP_MAX_RENDER_TARGETS:
|
|
return 4;
|
|
|
|
case PIPE_CAP_VENDOR_ID:
|
|
return 0x14E4;
|
|
case PIPE_CAP_ACCELERATED:
|
|
return 1;
|
|
case PIPE_CAP_VIDEO_MEMORY: {
|
|
uint64_t system_memory;
|
|
|
|
if (!os_get_total_physical_memory(&system_memory))
|
|
return 0;
|
|
|
|
return (int)(system_memory >> 20);
|
|
}
|
|
case PIPE_CAP_UMA:
|
|
return 1;
|
|
|
|
case PIPE_CAP_ALPHA_TEST:
|
|
case PIPE_CAP_FLATSHADE:
|
|
case PIPE_CAP_TWO_SIDED_COLOR:
|
|
case PIPE_CAP_VERTEX_COLOR_CLAMPED:
|
|
case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
|
|
case PIPE_CAP_GL_CLAMP:
|
|
return 0;
|
|
|
|
/* Geometry shaders */
|
|
case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
|
|
/* Minimum required by GLES 3.2 */
|
|
return 1024;
|
|
case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
|
|
/* MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS / 4 */
|
|
return 256;
|
|
case PIPE_CAP_MAX_GS_INVOCATIONS:
|
|
return 32;
|
|
|
|
case PIPE_CAP_SUPPORTED_PRIM_MODES:
|
|
case PIPE_CAP_SUPPORTED_PRIM_MODES_WITH_RESTART:
|
|
return screen->prim_types;
|
|
|
|
case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
|
|
return true;
|
|
|
|
case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
|
|
return 256;
|
|
|
|
case PIPE_CAP_IMAGE_STORE_FORMATTED:
|
|
return false;
|
|
|
|
default:
|
|
return u_pipe_screen_get_param_defaults(pscreen, param);
|
|
}
|
|
}
|
|
|
|
static float
|
|
v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
|
|
{
|
|
switch (param) {
|
|
case PIPE_CAPF_MIN_LINE_WIDTH:
|
|
case PIPE_CAPF_MIN_LINE_WIDTH_AA:
|
|
case PIPE_CAPF_MIN_POINT_SIZE:
|
|
case PIPE_CAPF_MIN_POINT_SIZE_AA:
|
|
return 1;
|
|
|
|
case PIPE_CAPF_POINT_SIZE_GRANULARITY:
|
|
case PIPE_CAPF_LINE_WIDTH_GRANULARITY:
|
|
return 0.1;
|
|
|
|
case PIPE_CAPF_MAX_LINE_WIDTH:
|
|
case PIPE_CAPF_MAX_LINE_WIDTH_AA:
|
|
return V3D_MAX_LINE_WIDTH;
|
|
|
|
case PIPE_CAPF_MAX_POINT_SIZE:
|
|
case PIPE_CAPF_MAX_POINT_SIZE_AA:
|
|
return V3D_MAX_POINT_SIZE;
|
|
|
|
case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
|
|
return 16.0f;
|
|
case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
|
|
return 16.0f;
|
|
|
|
case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
|
|
case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
|
|
case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
|
|
return 0.0f;
|
|
default:
|
|
fprintf(stderr, "unknown paramf %d\n", param);
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
static int
|
|
v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
|
|
enum pipe_shader_cap param)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
switch (shader) {
|
|
case PIPE_SHADER_VERTEX:
|
|
case PIPE_SHADER_FRAGMENT:
|
|
break;
|
|
case PIPE_SHADER_COMPUTE:
|
|
if (!screen->has_csd)
|
|
return 0;
|
|
break;
|
|
case PIPE_SHADER_GEOMETRY:
|
|
if (screen->devinfo.ver < 41)
|
|
return 0;
|
|
break;
|
|
default:
|
|
return 0;
|
|
}
|
|
|
|
/* this is probably not totally correct.. but it's a start: */
|
|
switch (param) {
|
|
case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
|
|
case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
|
|
case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
|
|
case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
|
|
return 16384;
|
|
|
|
case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
|
|
return UINT_MAX;
|
|
|
|
case PIPE_SHADER_CAP_MAX_INPUTS:
|
|
switch (shader) {
|
|
case PIPE_SHADER_VERTEX:
|
|
return V3D_MAX_VS_INPUTS / 4;
|
|
case PIPE_SHADER_GEOMETRY:
|
|
return V3D_MAX_GS_INPUTS / 4;
|
|
case PIPE_SHADER_FRAGMENT:
|
|
return V3D_MAX_FS_INPUTS / 4;
|
|
default:
|
|
return 0;
|
|
};
|
|
case PIPE_SHADER_CAP_MAX_OUTPUTS:
|
|
if (shader == PIPE_SHADER_FRAGMENT)
|
|
return 4;
|
|
else
|
|
return V3D_MAX_FS_INPUTS / 4;
|
|
case PIPE_SHADER_CAP_MAX_TEMPS:
|
|
return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
|
|
case PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE:
|
|
/* Note: Limited by the offset size in
|
|
* v3d_unit_data_create().
|
|
*/
|
|
return 16 * 1024 * sizeof(float);
|
|
case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
|
|
return 16;
|
|
case PIPE_SHADER_CAP_CONT_SUPPORTED:
|
|
return 0;
|
|
case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
|
|
/* We don't currently support this in the backend, but that is
|
|
* okay because our NIR compiler sets the option
|
|
* lower_all_io_to_temps, which will eliminate indirect
|
|
* indexing on all input/output variables by translating it to
|
|
* indirect indexing on temporary variables instead, which we
|
|
* will then lower to scratch. We prefer this over setting this
|
|
* to 0, which would cause if-ladder injection to eliminate
|
|
* indirect indexing on inputs.
|
|
*/
|
|
return 1;
|
|
case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
|
|
return 1;
|
|
case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
|
|
return 1;
|
|
case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
|
|
return 1;
|
|
case PIPE_SHADER_CAP_SUBROUTINES:
|
|
return 0;
|
|
case PIPE_SHADER_CAP_INTEGERS:
|
|
return 1;
|
|
case PIPE_SHADER_CAP_FP16:
|
|
case PIPE_SHADER_CAP_FP16_DERIVATIVES:
|
|
case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
|
|
case PIPE_SHADER_CAP_INT16:
|
|
case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
|
|
case PIPE_SHADER_CAP_DROUND_SUPPORTED:
|
|
case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
|
|
case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
|
|
case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
|
|
case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
|
|
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
|
|
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
|
|
return 0;
|
|
case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
|
|
case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
|
|
return V3D_MAX_TEXTURE_SAMPLERS;
|
|
|
|
case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
|
|
if (screen->has_cache_flush) {
|
|
if (shader == PIPE_SHADER_VERTEX ||
|
|
shader == PIPE_SHADER_GEOMETRY) {
|
|
return 0;
|
|
}
|
|
return PIPE_MAX_SHADER_BUFFERS;
|
|
} else {
|
|
return 0;
|
|
}
|
|
|
|
case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
|
|
if (screen->has_cache_flush) {
|
|
if (screen->devinfo.ver < 41)
|
|
return 0;
|
|
else
|
|
return PIPE_MAX_SHADER_IMAGES;
|
|
} else {
|
|
return 0;
|
|
}
|
|
|
|
case PIPE_SHADER_CAP_PREFERRED_IR:
|
|
return PIPE_SHADER_IR_NIR;
|
|
case PIPE_SHADER_CAP_SUPPORTED_IRS:
|
|
return 1 << PIPE_SHADER_IR_NIR;
|
|
default:
|
|
fprintf(stderr, "unknown shader param %d\n", param);
|
|
return 0;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int
|
|
v3d_get_compute_param(struct pipe_screen *pscreen, enum pipe_shader_ir ir_type,
|
|
enum pipe_compute_cap param, void *ret)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
if (!screen->has_csd)
|
|
return 0;
|
|
|
|
#define RET(x) do { \
|
|
if (ret) \
|
|
memcpy(ret, x, sizeof(x)); \
|
|
return sizeof(x); \
|
|
} while (0)
|
|
|
|
switch (param) {
|
|
case PIPE_COMPUTE_CAP_ADDRESS_BITS:
|
|
RET((uint32_t []) { 32 });
|
|
break;
|
|
|
|
case PIPE_COMPUTE_CAP_IR_TARGET:
|
|
sprintf(ret, "v3d");
|
|
return strlen(ret);
|
|
|
|
case PIPE_COMPUTE_CAP_GRID_DIMENSION:
|
|
RET((uint64_t []) { 3 });
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
|
|
/* GL_MAX_COMPUTE_SHADER_WORK_GROUP_COUNT: The CSD has a
|
|
* 16-bit field for the number of workgroups in each
|
|
* dimension.
|
|
*/
|
|
RET(((uint64_t []) { 65535, 65535, 65535 }));
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
|
|
/* GL_MAX_COMPUTE_WORK_GROUP_SIZE */
|
|
RET(((uint64_t []) { 256, 256, 256 }));
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
|
|
case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
|
|
/* GL_MAX_COMPUTE_WORK_GROUP_INVOCATIONS: This is
|
|
* limited by WG_SIZE in the CSD.
|
|
*/
|
|
RET((uint64_t []) { 256 });
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
|
|
RET((uint64_t []) { 1024 * 1024 * 1024 });
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
|
|
/* GL_MAX_COMPUTE_SHARED_MEMORY_SIZE */
|
|
RET((uint64_t []) { 32768 });
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
|
|
case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
|
|
RET((uint64_t []) { 4096 });
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE: {
|
|
struct sysinfo si;
|
|
sysinfo(&si);
|
|
RET((uint64_t []) { si.totalram });
|
|
}
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
|
|
/* OpenCL only */
|
|
RET((uint32_t []) { 0 });
|
|
|
|
case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
|
|
RET((uint32_t []) { 1 });
|
|
|
|
case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
|
|
RET((uint32_t []) { 1 });
|
|
|
|
case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
|
|
RET((uint32_t []) { 16 });
|
|
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static bool
|
|
v3d_screen_is_format_supported(struct pipe_screen *pscreen,
|
|
enum pipe_format format,
|
|
enum pipe_texture_target target,
|
|
unsigned sample_count,
|
|
unsigned storage_sample_count,
|
|
unsigned usage)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
|
|
return false;
|
|
|
|
if (sample_count > 1 && sample_count != V3D_MAX_SAMPLES)
|
|
return false;
|
|
|
|
if (target >= PIPE_MAX_TEXTURE_TYPES) {
|
|
return false;
|
|
}
|
|
|
|
if (usage & PIPE_BIND_VERTEX_BUFFER) {
|
|
switch (format) {
|
|
case PIPE_FORMAT_R32G32B32A32_FLOAT:
|
|
case PIPE_FORMAT_R32G32B32_FLOAT:
|
|
case PIPE_FORMAT_R32G32_FLOAT:
|
|
case PIPE_FORMAT_R32_FLOAT:
|
|
case PIPE_FORMAT_R32G32B32A32_SNORM:
|
|
case PIPE_FORMAT_R32G32B32_SNORM:
|
|
case PIPE_FORMAT_R32G32_SNORM:
|
|
case PIPE_FORMAT_R32_SNORM:
|
|
case PIPE_FORMAT_R32G32B32A32_SSCALED:
|
|
case PIPE_FORMAT_R32G32B32_SSCALED:
|
|
case PIPE_FORMAT_R32G32_SSCALED:
|
|
case PIPE_FORMAT_R32_SSCALED:
|
|
case PIPE_FORMAT_R16G16B16A16_UNORM:
|
|
case PIPE_FORMAT_R16G16B16_UNORM:
|
|
case PIPE_FORMAT_R16G16_UNORM:
|
|
case PIPE_FORMAT_R16_UNORM:
|
|
case PIPE_FORMAT_R16G16B16A16_SNORM:
|
|
case PIPE_FORMAT_R16G16B16_SNORM:
|
|
case PIPE_FORMAT_R16G16_SNORM:
|
|
case PIPE_FORMAT_R16_SNORM:
|
|
case PIPE_FORMAT_R16G16B16A16_USCALED:
|
|
case PIPE_FORMAT_R16G16B16_USCALED:
|
|
case PIPE_FORMAT_R16G16_USCALED:
|
|
case PIPE_FORMAT_R16_USCALED:
|
|
case PIPE_FORMAT_R16G16B16A16_SSCALED:
|
|
case PIPE_FORMAT_R16G16B16_SSCALED:
|
|
case PIPE_FORMAT_R16G16_SSCALED:
|
|
case PIPE_FORMAT_R16_SSCALED:
|
|
case PIPE_FORMAT_B8G8R8A8_UNORM:
|
|
case PIPE_FORMAT_R8G8B8A8_UNORM:
|
|
case PIPE_FORMAT_R8G8B8_UNORM:
|
|
case PIPE_FORMAT_R8G8_UNORM:
|
|
case PIPE_FORMAT_R8_UNORM:
|
|
case PIPE_FORMAT_R8G8B8A8_SNORM:
|
|
case PIPE_FORMAT_R8G8B8_SNORM:
|
|
case PIPE_FORMAT_R8G8_SNORM:
|
|
case PIPE_FORMAT_R8_SNORM:
|
|
case PIPE_FORMAT_R8G8B8A8_USCALED:
|
|
case PIPE_FORMAT_R8G8B8_USCALED:
|
|
case PIPE_FORMAT_R8G8_USCALED:
|
|
case PIPE_FORMAT_R8_USCALED:
|
|
case PIPE_FORMAT_R8G8B8A8_SSCALED:
|
|
case PIPE_FORMAT_R8G8B8_SSCALED:
|
|
case PIPE_FORMAT_R8G8_SSCALED:
|
|
case PIPE_FORMAT_R8_SSCALED:
|
|
case PIPE_FORMAT_R10G10B10A2_UNORM:
|
|
case PIPE_FORMAT_B10G10R10A2_UNORM:
|
|
case PIPE_FORMAT_R10G10B10A2_SNORM:
|
|
case PIPE_FORMAT_B10G10R10A2_SNORM:
|
|
case PIPE_FORMAT_R10G10B10A2_USCALED:
|
|
case PIPE_FORMAT_B10G10R10A2_USCALED:
|
|
case PIPE_FORMAT_R10G10B10A2_SSCALED:
|
|
case PIPE_FORMAT_B10G10R10A2_SSCALED:
|
|
break;
|
|
default:
|
|
return false;
|
|
}
|
|
}
|
|
|
|
/* FORMAT_NONE gets allowed for ARB_framebuffer_no_attachments's probe
|
|
* of FRAMEBUFFER_MAX_SAMPLES
|
|
*/
|
|
if ((usage & PIPE_BIND_RENDER_TARGET) &&
|
|
format != PIPE_FORMAT_NONE &&
|
|
!v3d_rt_format_supported(&screen->devinfo, format)) {
|
|
return false;
|
|
}
|
|
|
|
if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
|
|
!v3d_tex_format_supported(&screen->devinfo, format)) {
|
|
return false;
|
|
}
|
|
|
|
if ((usage & PIPE_BIND_DEPTH_STENCIL) &&
|
|
!(format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
|
|
format == PIPE_FORMAT_X8Z24_UNORM ||
|
|
format == PIPE_FORMAT_Z16_UNORM ||
|
|
format == PIPE_FORMAT_Z32_FLOAT ||
|
|
format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) {
|
|
return false;
|
|
}
|
|
|
|
if ((usage & PIPE_BIND_INDEX_BUFFER) &&
|
|
!(format == PIPE_FORMAT_R8_UINT ||
|
|
format == PIPE_FORMAT_R16_UINT ||
|
|
format == PIPE_FORMAT_R32_UINT)) {
|
|
return false;
|
|
}
|
|
|
|
if (usage & PIPE_BIND_SHADER_IMAGE) {
|
|
switch (format) {
|
|
/* FIXME: maybe we can implement a swizzle-on-writes to add
|
|
* support for BGRA-alike formats.
|
|
*/
|
|
case PIPE_FORMAT_A4B4G4R4_UNORM:
|
|
case PIPE_FORMAT_A1B5G5R5_UNORM:
|
|
case PIPE_FORMAT_B5G6R5_UNORM:
|
|
case PIPE_FORMAT_B8G8R8A8_UNORM:
|
|
case PIPE_FORMAT_X8Z24_UNORM:
|
|
case PIPE_FORMAT_Z16_UNORM:
|
|
return false;
|
|
default:
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static const nir_shader_compiler_options v3d_nir_options = {
|
|
.lower_uadd_sat = true,
|
|
.lower_usub_sat = true,
|
|
.lower_iadd_sat = true,
|
|
.lower_all_io_to_temps = true,
|
|
.lower_extract_byte = true,
|
|
.lower_extract_word = true,
|
|
.lower_insert_byte = true,
|
|
.lower_insert_word = true,
|
|
.lower_bitfield_insert_to_shifts = true,
|
|
.lower_bitfield_extract_to_shifts = true,
|
|
.lower_bitfield_reverse = true,
|
|
.lower_bit_count = true,
|
|
.lower_cs_local_id_to_index = true,
|
|
.lower_ffract = true,
|
|
.lower_fmod = true,
|
|
.lower_pack_unorm_2x16 = true,
|
|
.lower_pack_snorm_2x16 = true,
|
|
.lower_pack_unorm_4x8 = true,
|
|
.lower_pack_snorm_4x8 = true,
|
|
.lower_unpack_unorm_4x8 = true,
|
|
.lower_unpack_snorm_4x8 = true,
|
|
.lower_pack_half_2x16 = true,
|
|
.lower_unpack_half_2x16 = true,
|
|
.lower_pack_32_2x16 = true,
|
|
.lower_pack_32_2x16_split = true,
|
|
.lower_unpack_32_2x16_split = true,
|
|
.lower_fdiv = true,
|
|
.lower_find_lsb = true,
|
|
.lower_ffma16 = true,
|
|
.lower_ffma32 = true,
|
|
.lower_ffma64 = true,
|
|
.lower_flrp32 = true,
|
|
.lower_fpow = true,
|
|
.lower_fsat = true,
|
|
.lower_fsqrt = true,
|
|
.lower_ifind_msb = true,
|
|
.lower_isign = true,
|
|
.lower_ldexp = true,
|
|
.lower_mul_high = true,
|
|
.lower_wpos_pntc = true,
|
|
.lower_rotate = true,
|
|
.lower_to_scalar = true,
|
|
.lower_int64_options = nir_lower_imul_2x32_64,
|
|
.has_fsub = true,
|
|
.has_isub = true,
|
|
.divergence_analysis_options =
|
|
nir_divergence_multiple_workgroup_per_compute_subgroup,
|
|
/* This will enable loop unrolling in the state tracker so we won't
|
|
* be able to selectively disable it in backend if it leads to
|
|
* lower thread counts or TMU spills. Choose a conservative maximum to
|
|
* limit register pressure impact.
|
|
*/
|
|
.max_unroll_iterations = 16,
|
|
.force_indirect_unrolling_sampler = true,
|
|
};
|
|
|
|
static const void *
|
|
v3d_screen_get_compiler_options(struct pipe_screen *pscreen,
|
|
enum pipe_shader_ir ir, unsigned shader)
|
|
{
|
|
return &v3d_nir_options;
|
|
}
|
|
|
|
static const uint64_t v3d_available_modifiers[] = {
|
|
DRM_FORMAT_MOD_BROADCOM_UIF,
|
|
DRM_FORMAT_MOD_LINEAR,
|
|
DRM_FORMAT_MOD_BROADCOM_SAND128,
|
|
};
|
|
|
|
static void
|
|
v3d_screen_query_dmabuf_modifiers(struct pipe_screen *pscreen,
|
|
enum pipe_format format, int max,
|
|
uint64_t *modifiers,
|
|
unsigned int *external_only,
|
|
int *count)
|
|
{
|
|
int i;
|
|
int num_modifiers = ARRAY_SIZE(v3d_available_modifiers);
|
|
|
|
/* Expose DRM_FORMAT_MOD_BROADCOM_SAND128 only for PIPE_FORMAT_NV12 */
|
|
if (format != PIPE_FORMAT_NV12)
|
|
num_modifiers--;
|
|
|
|
if (!modifiers) {
|
|
*count = num_modifiers;
|
|
return;
|
|
}
|
|
|
|
*count = MIN2(max, num_modifiers);
|
|
for (i = 0; i < *count; i++) {
|
|
modifiers[i] = v3d_available_modifiers[i];
|
|
if (external_only)
|
|
external_only[i] = util_format_is_yuv(format);
|
|
}
|
|
}
|
|
|
|
static bool
|
|
v3d_screen_is_dmabuf_modifier_supported(struct pipe_screen *pscreen,
|
|
uint64_t modifier,
|
|
enum pipe_format format,
|
|
bool *external_only)
|
|
{
|
|
int i;
|
|
bool is_sand_col128 = (format == PIPE_FORMAT_NV12) &&
|
|
(fourcc_mod_broadcom_mod(modifier) == DRM_FORMAT_MOD_BROADCOM_SAND128);
|
|
|
|
if (is_sand_col128) {
|
|
if (external_only)
|
|
*external_only = true;
|
|
return true;
|
|
}
|
|
|
|
/* We don't want to generally allow DRM_FORMAT_MOD_BROADCOM_SAND128
|
|
* modifier, that is the last v3d_available_modifiers. We only accept
|
|
* it in the case of having a PIPE_FORMAT_NV12.
|
|
*/
|
|
assert(v3d_available_modifiers[ARRAY_SIZE(v3d_available_modifiers) - 1] ==
|
|
DRM_FORMAT_MOD_BROADCOM_SAND128);
|
|
for (i = 0; i < ARRAY_SIZE(v3d_available_modifiers) - 1; i++) {
|
|
if (v3d_available_modifiers[i] == modifier) {
|
|
if (external_only)
|
|
*external_only = util_format_is_yuv(format);
|
|
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
static enum pipe_format
|
|
v3d_screen_get_compatible_tlb_format(struct pipe_screen *screen,
|
|
enum pipe_format format)
|
|
{
|
|
switch (format) {
|
|
case PIPE_FORMAT_R16G16_UNORM:
|
|
return PIPE_FORMAT_R16G16_UINT;
|
|
default:
|
|
return format;
|
|
}
|
|
}
|
|
|
|
static struct disk_cache *
|
|
v3d_screen_get_disk_shader_cache(struct pipe_screen *pscreen)
|
|
{
|
|
struct v3d_screen *screen = v3d_screen(pscreen);
|
|
|
|
return screen->disk_cache;
|
|
}
|
|
|
|
struct pipe_screen *
|
|
v3d_screen_create(int fd, const struct pipe_screen_config *config,
|
|
struct renderonly *ro)
|
|
{
|
|
struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen);
|
|
struct pipe_screen *pscreen;
|
|
|
|
pscreen = &screen->base;
|
|
|
|
pscreen->destroy = v3d_screen_destroy;
|
|
pscreen->get_param = v3d_screen_get_param;
|
|
pscreen->get_paramf = v3d_screen_get_paramf;
|
|
pscreen->get_shader_param = v3d_screen_get_shader_param;
|
|
pscreen->get_compute_param = v3d_get_compute_param;
|
|
pscreen->context_create = v3d_context_create;
|
|
pscreen->is_format_supported = v3d_screen_is_format_supported;
|
|
pscreen->get_canonical_format = v3d_screen_get_compatible_tlb_format;
|
|
|
|
screen->fd = fd;
|
|
screen->ro = ro;
|
|
|
|
list_inithead(&screen->bo_cache.time_list);
|
|
(void)mtx_init(&screen->bo_handles_mutex, mtx_plain);
|
|
screen->bo_handles = util_hash_table_create_ptr_keys();
|
|
|
|
#if defined(USE_V3D_SIMULATOR)
|
|
screen->sim_file = v3d_simulator_init(screen->fd);
|
|
#endif
|
|
|
|
if (!v3d_get_device_info(screen->fd, &screen->devinfo, &v3d_ioctl))
|
|
goto fail;
|
|
|
|
driParseConfigFiles(config->options, config->options_info, 0, "v3d",
|
|
NULL, NULL, NULL, 0, NULL, 0);
|
|
|
|
/* We have to driCheckOption for the simulator mode to not assertion
|
|
* fail on not having our XML config.
|
|
*/
|
|
const char *nonmsaa_name = "v3d_nonmsaa_texture_size_limit";
|
|
screen->nonmsaa_texture_size_limit =
|
|
driCheckOption(config->options, nonmsaa_name, DRI_BOOL) &&
|
|
driQueryOptionb(config->options, nonmsaa_name);
|
|
|
|
slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16);
|
|
|
|
screen->has_csd = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CSD);
|
|
screen->has_cache_flush =
|
|
v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CACHE_FLUSH);
|
|
screen->has_perfmon = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_PERFMON);
|
|
|
|
v3d_fence_init(screen);
|
|
|
|
v3d_process_debug_variable();
|
|
|
|
v3d_resource_screen_init(pscreen);
|
|
|
|
screen->compiler = v3d_compiler_init(&screen->devinfo, 0);
|
|
|
|
#ifdef ENABLE_SHADER_CACHE
|
|
v3d_disk_cache_init(screen);
|
|
#endif
|
|
|
|
pscreen->get_name = v3d_screen_get_name;
|
|
pscreen->get_vendor = v3d_screen_get_vendor;
|
|
pscreen->get_device_vendor = v3d_screen_get_vendor;
|
|
pscreen->get_compiler_options = v3d_screen_get_compiler_options;
|
|
pscreen->get_disk_shader_cache = v3d_screen_get_disk_shader_cache;
|
|
pscreen->query_dmabuf_modifiers = v3d_screen_query_dmabuf_modifiers;
|
|
pscreen->is_dmabuf_modifier_supported =
|
|
v3d_screen_is_dmabuf_modifier_supported;
|
|
|
|
if (screen->has_perfmon) {
|
|
pscreen->get_driver_query_group_info = v3d_get_driver_query_group_info;
|
|
pscreen->get_driver_query_info = v3d_get_driver_query_info;
|
|
}
|
|
|
|
/* Generate the bitmask of supported draw primitives. */
|
|
screen->prim_types = BITFIELD_BIT(PIPE_PRIM_POINTS) |
|
|
BITFIELD_BIT(PIPE_PRIM_LINES) |
|
|
BITFIELD_BIT(PIPE_PRIM_LINE_LOOP) |
|
|
BITFIELD_BIT(PIPE_PRIM_LINE_STRIP) |
|
|
BITFIELD_BIT(PIPE_PRIM_TRIANGLES) |
|
|
BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP) |
|
|
BITFIELD_BIT(PIPE_PRIM_TRIANGLE_FAN) |
|
|
BITFIELD_BIT(PIPE_PRIM_LINES_ADJACENCY) |
|
|
BITFIELD_BIT(PIPE_PRIM_LINE_STRIP_ADJACENCY) |
|
|
BITFIELD_BIT(PIPE_PRIM_TRIANGLES_ADJACENCY) |
|
|
BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP_ADJACENCY);
|
|
|
|
return pscreen;
|
|
|
|
fail:
|
|
close(fd);
|
|
ralloc_free(pscreen);
|
|
return NULL;
|
|
}
|