337 lines
11 KiB
C
337 lines
11 KiB
C
/*
|
|
* Copyright © 2017 Intel Corporation
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included
|
|
* in all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
* DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <time.h>
|
|
#include "pipe/p_defines.h"
|
|
#include "pipe/p_state.h"
|
|
#include "util/ralloc.h"
|
|
#include "util/u_inlines.h"
|
|
#include "util/format/u_format.h"
|
|
#include "util/u_upload_mgr.h"
|
|
#include "drm-uapi/i915_drm.h"
|
|
#include "crocus_context.h"
|
|
#include "crocus_resource.h"
|
|
#include "crocus_screen.h"
|
|
#include "common/intel_defines.h"
|
|
#include "common/intel_sample_positions.h"
|
|
|
|
/**
|
|
* The pipe->set_debug_callback() driver hook.
|
|
*/
|
|
static void
|
|
crocus_set_debug_callback(struct pipe_context *ctx,
|
|
const struct pipe_debug_callback *cb)
|
|
{
|
|
struct crocus_context *ice = (struct crocus_context *)ctx;
|
|
|
|
if (cb)
|
|
ice->dbg = *cb;
|
|
else
|
|
memset(&ice->dbg, 0, sizeof(ice->dbg));
|
|
}
|
|
|
|
static bool
|
|
crocus_init_identifier_bo(struct crocus_context *ice)
|
|
{
|
|
void *bo_map;
|
|
|
|
bo_map = crocus_bo_map(NULL, ice->workaround_bo, MAP_READ | MAP_WRITE);
|
|
if (!bo_map)
|
|
return false;
|
|
|
|
ice->workaround_bo->kflags |= EXEC_OBJECT_CAPTURE;
|
|
ice->workaround_offset = ALIGN(
|
|
intel_debug_write_identifiers(bo_map, 4096, "Crocus") + 8, 8);
|
|
|
|
crocus_bo_unmap(ice->workaround_bo);
|
|
|
|
return true;
|
|
}
|
|
|
|
/**
|
|
* Called from the batch module when it detects a GPU hang.
|
|
*
|
|
* In this case, we've lost our GEM context, and can't rely on any existing
|
|
* state on the GPU. We must mark everything dirty and wipe away any saved
|
|
* assumptions about the last known state of the GPU.
|
|
*/
|
|
void
|
|
crocus_lost_context_state(struct crocus_batch *batch)
|
|
{
|
|
/* The batch module doesn't have an crocus_context, because we want to
|
|
* avoid introducing lots of layering violations. Unfortunately, here
|
|
* we do need to inform the context of batch catastrophe. We know the
|
|
* batch is one of our context's, so hackily claw our way back.
|
|
*/
|
|
struct crocus_context *ice = batch->ice;
|
|
struct crocus_screen *screen = batch->screen;
|
|
if (batch->name == CROCUS_BATCH_RENDER) {
|
|
screen->vtbl.init_render_context(batch);
|
|
} else if (batch->name == CROCUS_BATCH_COMPUTE) {
|
|
screen->vtbl.init_compute_context(batch);
|
|
} else {
|
|
unreachable("unhandled batch reset");
|
|
}
|
|
|
|
ice->state.dirty = ~0ull;
|
|
memset(ice->state.last_grid, 0, sizeof(ice->state.last_grid));
|
|
batch->state_base_address_emitted = false;
|
|
screen->vtbl.lost_genx_state(ice, batch);
|
|
}
|
|
|
|
static enum pipe_reset_status
|
|
crocus_get_device_reset_status(struct pipe_context *ctx)
|
|
{
|
|
struct crocus_context *ice = (struct crocus_context *)ctx;
|
|
|
|
enum pipe_reset_status worst_reset = PIPE_NO_RESET;
|
|
|
|
/* Check the reset status of each batch's hardware context, and take the
|
|
* worst status (if one was guilty, proclaim guilt).
|
|
*/
|
|
for (int i = 0; i < ice->batch_count; i++) {
|
|
/* This will also recreate the hardware contexts as necessary, so any
|
|
* future queries will show no resets. We only want to report once.
|
|
*/
|
|
enum pipe_reset_status batch_reset =
|
|
crocus_batch_check_for_reset(&ice->batches[i]);
|
|
|
|
if (batch_reset == PIPE_NO_RESET)
|
|
continue;
|
|
|
|
if (worst_reset == PIPE_NO_RESET) {
|
|
worst_reset = batch_reset;
|
|
} else {
|
|
/* GUILTY < INNOCENT < UNKNOWN */
|
|
worst_reset = MIN2(worst_reset, batch_reset);
|
|
}
|
|
}
|
|
|
|
if (worst_reset != PIPE_NO_RESET && ice->reset.reset)
|
|
ice->reset.reset(ice->reset.data, worst_reset);
|
|
|
|
return worst_reset;
|
|
}
|
|
|
|
static void
|
|
crocus_set_device_reset_callback(struct pipe_context *ctx,
|
|
const struct pipe_device_reset_callback *cb)
|
|
{
|
|
struct crocus_context *ice = (struct crocus_context *)ctx;
|
|
|
|
if (cb)
|
|
ice->reset = *cb;
|
|
else
|
|
memset(&ice->reset, 0, sizeof(ice->reset));
|
|
}
|
|
|
|
static void
|
|
crocus_get_sample_position(struct pipe_context *ctx,
|
|
unsigned sample_count,
|
|
unsigned sample_index,
|
|
float *out_value)
|
|
{
|
|
union {
|
|
struct {
|
|
float x[16];
|
|
float y[16];
|
|
} a;
|
|
struct {
|
|
float _0XOffset, _1XOffset, _2XOffset, _3XOffset,
|
|
_4XOffset, _5XOffset, _6XOffset, _7XOffset,
|
|
_8XOffset, _9XOffset, _10XOffset, _11XOffset,
|
|
_12XOffset, _13XOffset, _14XOffset, _15XOffset;
|
|
float _0YOffset, _1YOffset, _2YOffset, _3YOffset,
|
|
_4YOffset, _5YOffset, _6YOffset, _7YOffset,
|
|
_8YOffset, _9YOffset, _10YOffset, _11YOffset,
|
|
_12YOffset, _13YOffset, _14YOffset, _15YOffset;
|
|
} v;
|
|
} u;
|
|
switch (sample_count) {
|
|
case 1: INTEL_SAMPLE_POS_1X(u.v._); break;
|
|
case 2: INTEL_SAMPLE_POS_2X(u.v._); break;
|
|
case 4: INTEL_SAMPLE_POS_4X(u.v._); break;
|
|
case 8: INTEL_SAMPLE_POS_8X(u.v._); break;
|
|
case 16: INTEL_SAMPLE_POS_16X(u.v._); break;
|
|
default: unreachable("invalid sample count");
|
|
}
|
|
|
|
out_value[0] = u.a.x[sample_index];
|
|
out_value[1] = u.a.y[sample_index];
|
|
}
|
|
|
|
/**
|
|
* Destroy a context, freeing any associated memory.
|
|
*/
|
|
static void
|
|
crocus_destroy_context(struct pipe_context *ctx)
|
|
{
|
|
struct crocus_context *ice = (struct crocus_context *)ctx;
|
|
struct crocus_screen *screen = (struct crocus_screen *)ctx->screen;
|
|
if (ctx->stream_uploader)
|
|
u_upload_destroy(ctx->stream_uploader);
|
|
|
|
if (ice->blitter)
|
|
util_blitter_destroy(ice->blitter);
|
|
screen->vtbl.destroy_state(ice);
|
|
crocus_destroy_program_cache(ice);
|
|
u_upload_destroy(ice->query_buffer_uploader);
|
|
|
|
crocus_bo_unreference(ice->workaround_bo);
|
|
|
|
slab_destroy_child(&ice->transfer_pool);
|
|
|
|
crocus_batch_free(&ice->batches[CROCUS_BATCH_RENDER]);
|
|
if (ice->batches[CROCUS_BATCH_COMPUTE].ice)
|
|
crocus_batch_free(&ice->batches[CROCUS_BATCH_COMPUTE]);
|
|
|
|
ralloc_free(ice);
|
|
}
|
|
|
|
#define genX_call(devinfo, func, ...) \
|
|
switch ((devinfo)->verx10) { \
|
|
case 75: \
|
|
gfx75_##func(__VA_ARGS__); \
|
|
break; \
|
|
case 70: \
|
|
gfx7_##func(__VA_ARGS__); \
|
|
break; \
|
|
case 60: \
|
|
gfx6_##func(__VA_ARGS__); \
|
|
break; \
|
|
case 50: \
|
|
gfx5_##func(__VA_ARGS__); \
|
|
break; \
|
|
case 45: \
|
|
gfx45_##func(__VA_ARGS__); \
|
|
break; \
|
|
case 40: \
|
|
gfx4_##func(__VA_ARGS__); \
|
|
break; \
|
|
default: \
|
|
unreachable("Unknown hardware generation"); \
|
|
}
|
|
|
|
/**
|
|
* Create a context.
|
|
*
|
|
* This is where each context begins.
|
|
*/
|
|
struct pipe_context *
|
|
crocus_create_context(struct pipe_screen *pscreen, void *priv, unsigned flags)
|
|
{
|
|
struct crocus_screen *screen = (struct crocus_screen*)pscreen;
|
|
const struct intel_device_info *devinfo = &screen->devinfo;
|
|
struct crocus_context *ice = rzalloc(NULL, struct crocus_context);
|
|
|
|
if (!ice)
|
|
return NULL;
|
|
|
|
struct pipe_context *ctx = &ice->ctx;
|
|
|
|
ctx->screen = pscreen;
|
|
ctx->priv = priv;
|
|
|
|
ctx->stream_uploader = u_upload_create_default(ctx);
|
|
if (!ctx->stream_uploader) {
|
|
free(ctx);
|
|
return NULL;
|
|
}
|
|
ctx->const_uploader = ctx->stream_uploader;
|
|
|
|
ctx->destroy = crocus_destroy_context;
|
|
ctx->set_debug_callback = crocus_set_debug_callback;
|
|
ctx->set_device_reset_callback = crocus_set_device_reset_callback;
|
|
ctx->get_device_reset_status = crocus_get_device_reset_status;
|
|
ctx->get_sample_position = crocus_get_sample_position;
|
|
|
|
ice->shaders.urb_size = devinfo->urb.size;
|
|
|
|
crocus_init_context_fence_functions(ctx);
|
|
crocus_init_blit_functions(ctx);
|
|
crocus_init_clear_functions(ctx);
|
|
crocus_init_program_functions(ctx);
|
|
crocus_init_resource_functions(ctx);
|
|
crocus_init_flush_functions(ctx);
|
|
|
|
crocus_init_program_cache(ice);
|
|
|
|
slab_create_child(&ice->transfer_pool, &screen->transfer_pool);
|
|
|
|
ice->query_buffer_uploader =
|
|
u_upload_create(ctx, 4096, PIPE_BIND_CUSTOM, PIPE_USAGE_STAGING,
|
|
0);
|
|
|
|
ice->workaround_bo =
|
|
crocus_bo_alloc(screen->bufmgr, "workaround", 4096);
|
|
if (!ice->workaround_bo)
|
|
return NULL;
|
|
|
|
if (!crocus_init_identifier_bo(ice))
|
|
return NULL;
|
|
|
|
genX_call(devinfo, init_state, ice);
|
|
genX_call(devinfo, init_blorp, ice);
|
|
genX_call(devinfo, init_query, ice);
|
|
|
|
ice->blitter = util_blitter_create(&ice->ctx);
|
|
if (ice->blitter == NULL)
|
|
return NULL;
|
|
int priority = 0;
|
|
if (flags & PIPE_CONTEXT_HIGH_PRIORITY)
|
|
priority = INTEL_CONTEXT_HIGH_PRIORITY;
|
|
if (flags & PIPE_CONTEXT_LOW_PRIORITY)
|
|
priority = INTEL_CONTEXT_LOW_PRIORITY;
|
|
|
|
ice->batch_count = devinfo->ver >= 7 ? CROCUS_BATCH_COUNT : 1;
|
|
for (int i = 0; i < ice->batch_count; i++) {
|
|
crocus_init_batch(ice, (enum crocus_batch_name) i,
|
|
priority);
|
|
}
|
|
|
|
ice->urb.size = devinfo->urb.size;
|
|
screen->vtbl.init_render_context(&ice->batches[CROCUS_BATCH_RENDER]);
|
|
if (ice->batch_count > 1)
|
|
screen->vtbl.init_compute_context(&ice->batches[CROCUS_BATCH_COMPUTE]);
|
|
|
|
return ctx;
|
|
}
|
|
|
|
bool
|
|
crocus_sw_check_cond_render(struct crocus_context *ice)
|
|
{
|
|
struct crocus_query *q = ice->condition.query;
|
|
union pipe_query_result result;
|
|
|
|
bool wait = ice->condition.mode == PIPE_RENDER_COND_WAIT ||
|
|
ice->condition.mode == PIPE_RENDER_COND_BY_REGION_WAIT;
|
|
if (!q)
|
|
return true;
|
|
|
|
bool ret = ice->ctx.get_query_result(&ice->ctx, (void *)q, wait, &result);
|
|
if (!ret)
|
|
return true;
|
|
|
|
return ice->condition.condition ? result.u64 == 0 : result.u64 != 0;
|
|
}
|