|
|
|
/**************************************************************************
|
|
|
|
*
|
|
|
|
* Copyright (C) 2014 Red Hat Inc.
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
|
|
* to deal in the Software without restriction, including without limitation
|
|
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included
|
|
|
|
* in all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
|
|
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
|
|
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
|
|
* OTHER DEALINGS IN THE SOFTWARE.
|
|
|
|
*
|
|
|
|
**************************************************************************/
|
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <time.h>
|
|
|
|
|
|
|
|
#include <epoxy/gl.h>
|
|
|
|
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <fcntl.h>
|
|
|
|
#include <errno.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
#include "pipe/p_state.h"
|
|
|
|
#include "util/u_format.h"
|
|
|
|
#include "util/u_math.h"
|
|
|
|
#include "vrend_renderer.h"
|
|
|
|
#include "vrend_winsys.h"
|
|
|
|
|
|
|
|
#include "virglrenderer.h"
|
|
|
|
#include "virglrenderer_hw.h"
|
|
|
|
|
|
|
|
#include "virgl_context.h"
|
|
|
|
#include "virgl_resource.h"
|
|
|
|
|
|
|
|
/*
 * Renderer-wide state shared by the entry points in this file.  The object
 * has static storage duration, so every field starts out zeroed.
 */
static struct global_state {
   /* opaque client pointer handed back to the client callbacks */
   void *cookie;
   /* callback table supplied by the client in virgl_renderer_init() */
   const struct virgl_renderer_callbacks *cbs;

   /* set once vrend_renderer_init() has succeeded */
   bool vrend_initialized;
} state;
|
|
|
|
|
|
|
|
/* new API - just wrap internal API for now */
|
|
|
|
|
|
|
|
static int virgl_renderer_resource_create_internal(struct virgl_renderer_resource_create_args *args,
|
|
|
|
UNUSED struct iovec *iov, UNUSED uint32_t num_iovs,
|
|
|
|
void *image)
|
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
struct pipe_resource *pipe_res;
|
|
|
|
struct vrend_renderer_resource_create_args vrend_args = { 0 };
|
|
|
|
|
|
|
|
/* do not accept handle 0 */
|
|
|
|
if (args->handle == 0)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
vrend_args.target = args->target;
|
|
|
|
vrend_args.format = args->format;
|
|
|
|
vrend_args.bind = args->bind;
|
|
|
|
vrend_args.width = args->width;
|
|
|
|
vrend_args.height = args->height;
|
|
|
|
vrend_args.depth = args->depth;
|
|
|
|
vrend_args.array_size = args->array_size;
|
|
|
|
vrend_args.nr_samples = args->nr_samples;
|
|
|
|
vrend_args.last_level = args->last_level;
|
|
|
|
vrend_args.flags = args->flags;
|
|
|
|
|
|
|
|
pipe_res = vrend_renderer_resource_create(&vrend_args, image);
|
|
|
|
if (!pipe_res)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
ret = virgl_resource_create_from_pipe(args->handle, pipe_res, iov, num_iovs);
|
|
|
|
if (ret) {
|
|
|
|
vrend_renderer_resource_destroy((struct vrend_resource *)pipe_res);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Create a resource described by `args` and register it with the given
 * iovec array.  No image is supplied on this path.
 *
 * Returns whatever virgl_renderer_resource_create_internal() returns.
 */
int virgl_renderer_resource_create(struct virgl_renderer_resource_create_args *args,
                                   struct iovec *iov, uint32_t num_iovs)
{
   void *no_image = NULL;

   return virgl_renderer_resource_create_internal(args, iov, num_iovs, no_image);
}
|
|
|
|
|
|
|
|
/*
 * Create a resource described by `args` on top of `image`.  The resource is
 * registered without any iovec array.
 *
 * Returns whatever virgl_renderer_resource_create_internal() returns.
 */
int virgl_renderer_resource_import_eglimage(struct virgl_renderer_resource_create_args *args, void *image)
{
   struct iovec *no_iov = NULL;

   return virgl_renderer_resource_create_internal(args, no_iov, 0, image);
}
|
|
|
|
|
|
|
|
void virgl_renderer_resource_set_priv(uint32_t res_handle, void *priv)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!res)
|
|
|
|
return;
|
|
|
|
|
|
|
|
res->private_data = priv;
|
|
|
|
}
|
|
|
|
|
|
|
|
void *virgl_renderer_resource_get_priv(uint32_t res_handle)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!res)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
return res->private_data;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool detach_resource(struct virgl_context *ctx, void *data)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = data;
|
|
|
|
ctx->detach_resource(ctx, res);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void virgl_renderer_resource_unref(uint32_t res_handle)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
struct virgl_context_foreach_args args;
|
|
|
|
|
|
|
|
if (!res)
|
|
|
|
return;
|
|
|
|
|
|
|
|
args.callback = detach_resource;
|
|
|
|
args.data = res;
|
|
|
|
virgl_context_foreach(&args);
|
|
|
|
|
|
|
|
virgl_resource_remove(res->res_id);
|
|
|
|
}
|
|
|
|
|
|
|
|
void virgl_renderer_fill_caps(uint32_t set, uint32_t version,
|
|
|
|
void *caps)
|
|
|
|
{
|
|
|
|
switch (set) {
|
|
|
|
case VIRGL_RENDERER_CAPSET_VIRGL:
|
|
|
|
vrend_renderer_fill_caps(VREND_CAP_SET, version, (union virgl_caps *)caps);
|
|
|
|
break;
|
|
|
|
case VIRGL_RENDERER_CAPSET_VIRGL2:
|
|
|
|
vrend_renderer_fill_caps(VREND_CAP_SET2, version, (union virgl_caps *)caps);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_context_create(uint32_t handle, uint32_t nlen, const char *name)
|
|
|
|
{
|
|
|
|
struct virgl_context *ctx;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
/* user context id must be greater than 0 */
|
|
|
|
if (handle == 0)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
if (virgl_context_lookup(handle))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
ctx = vrend_renderer_context_create(handle, nlen, name);
|
|
|
|
if (!ctx)
|
|
|
|
return ENOMEM;
|
|
|
|
|
|
|
|
ret = virgl_context_add(ctx);
|
|
|
|
if (ret) {
|
|
|
|
ctx->destroy(ctx);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Remove the context with id `handle` from the context table. */
void virgl_renderer_context_destroy(uint32_t handle)
{
   const uint32_t ctx_id = handle;

   virgl_context_remove(ctx_id);
}
|
|
|
|
|
|
|
|
int virgl_renderer_submit_cmd(void *buffer,
|
|
|
|
int ctx_id,
|
|
|
|
int ndw)
|
|
|
|
{
|
|
|
|
struct virgl_context *ctx = virgl_context_lookup(ctx_id);
|
|
|
|
if (!ctx)
|
|
|
|
return EINVAL;
|
|
|
|
return ctx->submit_cmd(ctx, buffer, sizeof(uint32_t) * ndw);
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_transfer_write_iov(uint32_t handle,
|
|
|
|
uint32_t ctx_id,
|
|
|
|
int level,
|
|
|
|
uint32_t stride,
|
|
|
|
uint32_t layer_stride,
|
|
|
|
struct virgl_box *box,
|
|
|
|
uint64_t offset,
|
|
|
|
struct iovec *iovec,
|
|
|
|
unsigned int iovec_cnt)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(handle);
|
|
|
|
struct vrend_transfer_info transfer_info;
|
|
|
|
|
|
|
|
if (!res)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
transfer_info.level = level;
|
|
|
|
transfer_info.stride = stride;
|
|
|
|
transfer_info.layer_stride = layer_stride;
|
|
|
|
transfer_info.box = (struct pipe_box *)box;
|
|
|
|
transfer_info.offset = offset;
|
|
|
|
transfer_info.iovec = iovec;
|
|
|
|
transfer_info.iovec_cnt = iovec_cnt;
|
|
|
|
transfer_info.synchronized = false;
|
|
|
|
|
|
|
|
if (ctx_id) {
|
|
|
|
struct virgl_context *ctx = virgl_context_lookup(ctx_id);
|
|
|
|
if (!ctx)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
return ctx->transfer_3d(ctx, res, &transfer_info,
|
|
|
|
VIRGL_TRANSFER_TO_HOST);
|
|
|
|
} else {
|
|
|
|
if (!res->pipe_resource)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
return vrend_renderer_transfer_pipe(res->pipe_resource, &transfer_info,
|
|
|
|
VIRGL_TRANSFER_TO_HOST);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_transfer_read_iov(uint32_t handle, uint32_t ctx_id,
|
|
|
|
uint32_t level, uint32_t stride,
|
|
|
|
uint32_t layer_stride,
|
|
|
|
struct virgl_box *box,
|
|
|
|
uint64_t offset, struct iovec *iovec,
|
|
|
|
int iovec_cnt)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(handle);
|
|
|
|
struct vrend_transfer_info transfer_info;
|
|
|
|
|
|
|
|
if (!res)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
transfer_info.level = level;
|
|
|
|
transfer_info.stride = stride;
|
|
|
|
transfer_info.layer_stride = layer_stride;
|
|
|
|
transfer_info.box = (struct pipe_box *)box;
|
|
|
|
transfer_info.offset = offset;
|
|
|
|
transfer_info.iovec = iovec;
|
|
|
|
transfer_info.iovec_cnt = iovec_cnt;
|
|
|
|
transfer_info.synchronized = false;
|
|
|
|
|
|
|
|
if (ctx_id) {
|
|
|
|
struct virgl_context *ctx = virgl_context_lookup(ctx_id);
|
|
|
|
if (!ctx)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
return ctx->transfer_3d(ctx, res, &transfer_info,
|
|
|
|
VIRGL_TRANSFER_FROM_HOST);
|
|
|
|
} else {
|
|
|
|
if (!res->pipe_resource)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
return vrend_renderer_transfer_pipe(res->pipe_resource, &transfer_info,
|
|
|
|
VIRGL_TRANSFER_FROM_HOST);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Attach the iovec array `iov` (with `num_iovs` entries) to resource
 * `res_handle`.
 *
 * Returns EINVAL for an unknown handle, otherwise the result of
 * virgl_resource_attach_iov().
 */
int virgl_renderer_resource_attach_iov(int res_handle, struct iovec *iov,
                                       int num_iovs)
{
   struct virgl_resource *target = virgl_resource_lookup(res_handle);

   return target ? virgl_resource_attach_iov(target, iov, num_iovs) : EINVAL;
}
|
|
|
|
|
|
|
|
void virgl_renderer_resource_detach_iov(int res_handle, struct iovec **iov_p, int *num_iovs_p)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!res)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (iov_p)
|
|
|
|
*iov_p = (struct iovec *)res->iov;
|
|
|
|
if (num_iovs_p)
|
|
|
|
*num_iovs_p = res->iov_count;
|
|
|
|
|
|
|
|
virgl_resource_detach_iov(res);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Create a fence identified by `client_fence_id` for context `ctx_id`.
 * Thin wrapper; returns the result of vrend_renderer_create_fence().
 */
int virgl_renderer_create_fence(int client_fence_id, uint32_t ctx_id)
{
   const int status = vrend_renderer_create_fence(client_fence_id, ctx_id);

   return status;
}
|
|
|
|
|
|
|
|
/* Public wrapper around vrend_renderer_force_ctx_0(). */
void virgl_renderer_force_ctx_0(void)
{
   vrend_renderer_force_ctx_0();
   return;
}
|
|
|
|
|
|
|
|
void virgl_renderer_ctx_attach_resource(int ctx_id, int res_handle)
|
|
|
|
{
|
|
|
|
struct virgl_context *ctx = virgl_context_lookup(ctx_id);
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!ctx || !res)
|
|
|
|
return;
|
|
|
|
ctx->attach_resource(ctx, res);
|
|
|
|
}
|
|
|
|
|
|
|
|
void virgl_renderer_ctx_detach_resource(int ctx_id, int res_handle)
|
|
|
|
{
|
|
|
|
struct virgl_context *ctx = virgl_context_lookup(ctx_id);
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!ctx || !res)
|
|
|
|
return;
|
|
|
|
ctx->detach_resource(ctx, res);
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_resource_get_info(int res_handle,
|
|
|
|
struct virgl_renderer_resource_info *info)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return EINVAL;
|
|
|
|
if (!info)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
vrend_renderer_resource_get_info(res->pipe_resource,
|
|
|
|
(struct vrend_renderer_resource_info *)info);
|
|
|
|
info->handle = res_handle;
|
|
|
|
|
|
|
|
return vrend_winsys_get_fourcc_for_texture(info->tex_id,
|
|
|
|
info->virgl_format,
|
|
|
|
&info->drm_fourcc);
|
|
|
|
}
|
|
|
|
|
|
|
|
void virgl_renderer_get_cap_set(uint32_t cap_set, uint32_t *max_ver,
|
|
|
|
uint32_t *max_size)
|
|
|
|
{
|
|
|
|
switch (cap_set) {
|
|
|
|
case VIRGL_RENDERER_CAPSET_VIRGL:
|
|
|
|
vrend_renderer_get_cap_set(VREND_CAP_SET, max_ver, max_size);
|
|
|
|
break;
|
|
|
|
case VIRGL_RENDERER_CAPSET_VIRGL2:
|
|
|
|
vrend_renderer_get_cap_set(VREND_CAP_SET2, max_ver, max_size);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
*max_ver = 0;
|
|
|
|
*max_size = 0;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void virgl_renderer_get_rect(int resource_id, struct iovec *iov, unsigned int num_iovs,
|
|
|
|
uint32_t offset, int x, int y, int width, int height)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(resource_id);
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return;
|
|
|
|
|
|
|
|
vrend_renderer_get_rect(res->pipe_resource, iov, num_iovs, offset, x, y,
|
|
|
|
width, height);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static void virgl_write_fence(uint32_t fence_id)
|
|
|
|
{
|
|
|
|
state.cbs->write_fence(state.cookie, fence_id);
|
|
|
|
}
|
|
|
|
|
|
|
|
static virgl_renderer_gl_context create_gl_context(int scanout_idx, struct virgl_gl_ctx_param *param)
|
|
|
|
{
|
|
|
|
struct virgl_renderer_gl_ctx_param vparam;
|
|
|
|
|
|
|
|
if (use_context != CONTEXT_NONE)
|
|
|
|
return vrend_winsys_create_context(param);
|
|
|
|
|
|
|
|
vparam.version = 1;
|
|
|
|
vparam.shared = param->shared;
|
|
|
|
vparam.major_ver = param->major_ver;
|
|
|
|
vparam.minor_ver = param->minor_ver;
|
|
|
|
return state.cbs->create_gl_context(state.cookie, scanout_idx, &vparam);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * vrend callback: destroy a GL context, using the winsys when use_context
 * is not CONTEXT_NONE and the client's destroy_gl_context callback
 * otherwise.
 */
static void destroy_gl_context(virgl_renderer_gl_context ctx)
{
   if (use_context == CONTEXT_NONE)
      state.cbs->destroy_gl_context(state.cookie, ctx);
   else
      vrend_winsys_destroy_context(ctx);
}
|
|
|
|
|
|
|
|
/*
 * vrend callback: make `ctx` current, using the winsys when use_context is
 * not CONTEXT_NONE and the client's make_current callback otherwise.  The
 * client callback is always given 0 as its second argument here.
 */
static int make_current(virgl_renderer_gl_context ctx)
{
   if (use_context == CONTEXT_NONE)
      return state.cbs->make_current(state.cookie, 0, ctx);

   return vrend_winsys_make_context_current(ctx);
}
|
|
|
|
|
|
|
|
static const struct vrend_if_cbs vrend_cbs = {
|
|
|
|
virgl_write_fence,
|
|
|
|
create_gl_context,
|
|
|
|
destroy_gl_context,
|
|
|
|
make_current,
|
|
|
|
};
|
|
|
|
|
|
|
|
void *virgl_renderer_get_cursor_data(uint32_t resource_id, uint32_t *width, uint32_t *height)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(resource_id);
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
vrend_renderer_force_ctx_0();
|
|
|
|
return vrend_renderer_get_cursor_contents(res->pipe_resource,
|
|
|
|
width,
|
|
|
|
height);
|
|
|
|
}
|
|
|
|
|
|
|
|
void virgl_renderer_poll(void)
|
|
|
|
{
|
|
|
|
if (state.vrend_initialized)
|
|
|
|
vrend_renderer_check_fences();
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Tear the renderer down.
 *
 * If vrend was initialized, it is prepared for reset, the context table is
 * reset, the resource table is cleaned up and vrend is finalized.  The
 * context table and the winsys are then cleaned up unconditionally and the
 * global state is zeroed.  `cookie` is not used.
 */
void virgl_renderer_cleanup(UNUSED void *cookie)
{
   const bool vrend_up = state.vrend_initialized;

   if (vrend_up) {
      vrend_renderer_prepare_reset();
      virgl_context_table_reset();
      virgl_resource_table_cleanup();
      vrend_renderer_fini();
   }

   virgl_context_table_cleanup();
   vrend_winsys_cleanup();

   /* forget cookie, callbacks and the initialized flag */
   memset(&state, 0, sizeof state);
}
|
|
|
|
|
|
|
|
int virgl_renderer_init(void *cookie, int flags, struct virgl_renderer_callbacks *cbs)
|
|
|
|
{
|
|
|
|
int drm_fd = -1;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
if (!cookie || !cbs)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (cbs->version < 1 || cbs->version > VIRGL_RENDERER_CALLBACKS_VERSION)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
state.cookie = cookie;
|
|
|
|
state.cbs = cbs;
|
|
|
|
|
|
|
|
if (flags & VIRGL_RENDERER_USE_EGL) {
|
|
|
|
if (cbs->version >= 2 && cbs->get_drm_fd) {
|
|
|
|
drm_fd = cbs->get_drm_fd(cookie);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
ret = vrend_winsys_init(flags, drm_fd);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
if (virgl_context_table_init())
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (!state.vrend_initialized) {
|
|
|
|
uint32_t renderer_flags = 0;
|
|
|
|
|
|
|
|
if (flags & VIRGL_RENDERER_THREAD_SYNC)
|
|
|
|
renderer_flags |= VREND_USE_THREAD_SYNC;
|
|
|
|
if (flags & VIRGL_RENDERER_USE_EXTERNAL_BLOB)
|
|
|
|
renderer_flags |= VREND_USE_EXTERNAL_BLOB;
|
renderer: use a thread to block for fences.
Instead of polling the fences regularly, have a thread
that blocks for a single fence using a separate shared
context, then uses eventfd to wake up the main thread
when something happens.
Inside the guest, glmark2 typicially runs twice as fast with the thread
sync. Although in general, the performances seems to be about +30%. The
benefits is mostly for CPU-bounds tasks (when main the thread hits 100%)
A naive perf stat of the vtest renderer with glmark2 "build" test with a
fixed number of frames (500) results in the following stats data:
(do not value timing related informations, since the renderer is ran and
stopped manually)
without thread:
3032.282265 task-clock (msec) # 0.420 CPUs utilized
4,277 context-switches # 0.001 M/sec
102 cpu-migrations # 0.034 K/sec
9,020 page-faults # 0.003 M/sec
7,884,098,254 cycles # 2.600 GHz
4,440,126,451 stalled-cycles-frontend # 56.32% frontend cycles idle
<not supported> stalled-cycles-backend
11,024,091,578 instructions # 1.40 insns per cycle
# 0.40 stalled
# cycles per insn
1,091,831,588 branches # 360.069 M/sec
5,426,846 branch-misses # 0.50% of all branches
with thread:
3403.592921 task-clock (msec) # 0.452 CPUs utilized
7,145 context-switches # 0.002 M/sec
410 cpu-migrations # 0.120 K/sec
6,191 page-faults # 0.002 M/sec
7,475,038,064 cycles # 2.196 GHz
4,487,043,071 stalled-cycles-frontend # 60.03% frontend cycles idle
<not supported> stalled-cycles-backend
9,925,205,494 instructions # 1.33 insns per cycle
# 0.45 stalled
# cycles per insn
834,375,503 branches # 245.146 M/sec
4,919,995 branch-misses # 0.59% of all branches
Signed-off-by: Marc-André Lureau <marcandre.lureau@gmail.com>
Signed-off-by: Dave Airlie <airlied@redhat.com>
9 years ago
|
|
|
|
|
|
|
ret = vrend_renderer_init(&vrend_cbs, renderer_flags);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
state.vrend_initialized = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Thin wrapper: returns the result of vrend_winsys_get_fd_for_texture()
 * for texture `tex_id`, which receives `fd` as its output argument.
 */
int virgl_renderer_get_fd_for_texture(uint32_t tex_id, int *fd)
{
   const int status = vrend_winsys_get_fd_for_texture(tex_id, fd);

   return status;
}
|
|
|
|
|
|
|
|
/*
 * Thin wrapper: returns the result of vrend_winsys_get_fd_for_texture2()
 * for texture `tex_id`, which receives `fd`, `stride` and `offset` as its
 * output arguments.
 */
int virgl_renderer_get_fd_for_texture2(uint32_t tex_id, int *fd, int *stride, int *offset)
{
   const int status = vrend_winsys_get_fd_for_texture2(tex_id, fd, stride, offset);

   return status;
}
|
|
|
|
|
|
|
|
void virgl_renderer_reset(void)
|
|
|
|
{
|
|
|
|
if (state.vrend_initialized) {
|
|
|
|
vrend_renderer_prepare_reset();
|
|
|
|
virgl_context_table_reset();
|
|
|
|
virgl_resource_table_reset();
|
|
|
|
vrend_renderer_reset();
|
|
|
|
}
|
|
|
|
}
|
/*
 * renderer: use a thread to block for fences.
 *
 * Instead of polling the fences regularly, have a thread that blocks on a
 * single fence using a separate shared context, then uses an eventfd to wake
 * up the main thread when something happens.
 *
 * Inside the guest, glmark2 typically runs twice as fast with thread sync,
 * although in general the performance gain seems to be about +30%.  The
 * benefit is mostly for CPU-bound tasks (when the main thread hits 100%).
 *
 * A naive perf stat of the vtest renderer with the glmark2 "build" test and
 * a fixed number of frames (500) results in the following stats data (do not
 * value timing-related information, since the renderer is run and stopped
 * manually):
 *
 * without thread:
 *   3032.282265 task-clock (msec) # 0.420 CPUs utilized
 *   4,277 context-switches # 0.001 M/sec
 *   102 cpu-migrations # 0.034 K/sec
 *   9,020 page-faults # 0.003 M/sec
 *   7,884,098,254 cycles # 2.600 GHz
 *   4,440,126,451 stalled-cycles-frontend # 56.32% frontend cycles idle
 *   <not supported> stalled-cycles-backend
 *   11,024,091,578 instructions # 1.40 insns per cycle
 *                               # 0.40 stalled cycles per insn
 *   1,091,831,588 branches # 360.069 M/sec
 *   5,426,846 branch-misses # 0.50% of all branches
 *
 * with thread:
 *   3403.592921 task-clock (msec) # 0.452 CPUs utilized
 *   7,145 context-switches # 0.002 M/sec
 *   410 cpu-migrations # 0.120 K/sec
 *   6,191 page-faults # 0.002 M/sec
 *   7,475,038,064 cycles # 2.196 GHz
 *   4,487,043,071 stalled-cycles-frontend # 60.03% frontend cycles idle
 *   <not supported> stalled-cycles-backend
 *   9,925,205,494 instructions # 1.33 insns per cycle
 *                              # 0.45 stalled cycles per insn
 *   834,375,503 branches # 245.146 M/sec
 *   4,919,995 branch-misses # 0.59% of all branches
 *
 * Signed-off-by: Marc-André Lureau <marcandre.lureau@gmail.com>
 * Signed-off-by: Dave Airlie <airlied@redhat.com>
 * 9 years ago
 */
|
|
|
|
|
|
|
int virgl_renderer_get_poll_fd(void)
|
|
|
|
{
|
|
|
|
if (state.vrend_initialized)
|
|
|
|
return vrend_renderer_get_poll_fd();
|
|
|
|
|
|
|
|
return -1;
|
renderer: use a thread to block for fences.
Instead of polling the fences regularly, have a thread
that blocks for a single fence using a separate shared
context, then uses eventfd to wake up the main thread
when something happens.
Inside the guest, glmark2 typicially runs twice as fast with the thread
sync. Although in general, the performances seems to be about +30%. The
benefits is mostly for CPU-bounds tasks (when main the thread hits 100%)
A naive perf stat of the vtest renderer with glmark2 "build" test with a
fixed number of frames (500) results in the following stats data:
(do not value timing related informations, since the renderer is ran and
stopped manually)
without thread:
3032.282265 task-clock (msec) # 0.420 CPUs utilized
4,277 context-switches # 0.001 M/sec
102 cpu-migrations # 0.034 K/sec
9,020 page-faults # 0.003 M/sec
7,884,098,254 cycles # 2.600 GHz
4,440,126,451 stalled-cycles-frontend # 56.32% frontend cycles idle
<not supported> stalled-cycles-backend
11,024,091,578 instructions # 1.40 insns per cycle
# 0.40 stalled
# cycles per insn
1,091,831,588 branches # 360.069 M/sec
5,426,846 branch-misses # 0.50% of all branches
with thread:
3403.592921 task-clock (msec) # 0.452 CPUs utilized
7,145 context-switches # 0.002 M/sec
410 cpu-migrations # 0.120 K/sec
6,191 page-faults # 0.002 M/sec
7,475,038,064 cycles # 2.196 GHz
4,487,043,071 stalled-cycles-frontend # 60.03% frontend cycles idle
<not supported> stalled-cycles-backend
9,925,205,494 instructions # 1.33 insns per cycle
# 0.45 stalled
# cycles per insn
834,375,503 branches # 245.146 M/sec
4,919,995 branch-misses # 0.59% of all branches
Signed-off-by: Marc-André Lureau <marcandre.lureau@gmail.com>
Signed-off-by: Dave Airlie <airlied@redhat.com>
9 years ago
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Install `cb` as the debug callback via vrend_set_debug_callback() and
 * return that function's result.
 * NOTE(review): the result is presumably the previously installed
 * callback - confirm against vrend_set_debug_callback().
 */
virgl_debug_callback_type virgl_set_debug_callback(virgl_debug_callback_type cb)
{
   virgl_debug_callback_type result = vrend_set_debug_callback(cb);

   return result;
}
|
|
|
|
|
|
|
|
static int virgl_renderer_export_query(void *execute_args, uint32_t execute_size)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res;
|
|
|
|
struct virgl_renderer_export_query *export_query = execute_args;
|
|
|
|
if (execute_size != sizeof(struct virgl_renderer_export_query))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (export_query->hdr.size != sizeof(struct virgl_renderer_export_query))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
res = virgl_resource_lookup(export_query->in_resource_id);
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
return vrend_renderer_export_query(res->pipe_resource, export_query);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int virgl_renderer_supported_structures(void *execute_args, uint32_t execute_size)
|
|
|
|
{
|
|
|
|
struct virgl_renderer_supported_structures *supported_structures = execute_args;
|
|
|
|
if (execute_size != sizeof(struct virgl_renderer_supported_structures))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (supported_structures->hdr.size != sizeof(struct virgl_renderer_supported_structures))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (supported_structures->in_stype_version == 0) {
|
|
|
|
supported_structures->out_supported_structures_mask =
|
|
|
|
VIRGL_RENDERER_STRUCTURE_TYPE_EXPORT_QUERY |
|
|
|
|
VIRGL_RENDERER_STRUCTURE_TYPE_SUPPORTED_STRUCTURES;
|
|
|
|
} else {
|
|
|
|
supported_structures->out_supported_structures_mask = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_execute(void *execute_args, uint32_t execute_size)
|
|
|
|
{
|
|
|
|
struct virgl_renderer_hdr *hdr = execute_args;
|
|
|
|
if (hdr->stype_version != 0)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
switch (hdr->stype) {
|
|
|
|
case VIRGL_RENDERER_STRUCTURE_TYPE_SUPPORTED_STRUCTURES:
|
|
|
|
return virgl_renderer_supported_structures(execute_args, execute_size);
|
|
|
|
case VIRGL_RENDERER_STRUCTURE_TYPE_EXPORT_QUERY:
|
|
|
|
return virgl_renderer_export_query(execute_args, execute_size);
|
|
|
|
default:
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_resource_create_blob(const struct virgl_renderer_resource_create_blob_args *args)
|
|
|
|
{
|
|
|
|
struct virgl_context *ctx;
|
|
|
|
struct virgl_context_blob blob;
|
|
|
|
bool has_host_storage;
|
|
|
|
bool has_guest_storage;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
switch (args->blob_mem) {
|
|
|
|
case VIRGL_RENDERER_BLOB_MEM_GUEST:
|
|
|
|
has_host_storage = false;
|
|
|
|
has_guest_storage = true;
|
|
|
|
break;
|
|
|
|
case VIRGL_RENDERER_BLOB_MEM_HOST3D:
|
|
|
|
has_host_storage = true;
|
|
|
|
has_guest_storage = false;
|
|
|
|
break;
|
|
|
|
case VIRGL_RENDERER_BLOB_MEM_HOST3D_GUEST:
|
|
|
|
has_host_storage = true;
|
|
|
|
has_guest_storage = true;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* user resource id must be greater than 0 */
|
|
|
|
if (args->res_handle == 0)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (args->size == 0)
|
|
|
|
return -EINVAL;
|
|
|
|
if (has_guest_storage) {
|
|
|
|
const size_t iov_size = vrend_get_iovec_size(args->iovecs, args->num_iovs);
|
|
|
|
if (iov_size < args->size)
|
|
|
|
return -EINVAL;
|
|
|
|
} else {
|
|
|
|
if (args->num_iovs)
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!has_host_storage) {
|
|
|
|
return virgl_resource_create_from_iov(args->res_handle,
|
|
|
|
args->iovecs,
|
|
|
|
args->num_iovs);
|
|
|
|
}
|
|
|
|
|
|
|
|
ctx = virgl_context_lookup(args->ctx_id);
|
|
|
|
if (!ctx)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
ret = ctx->get_blob(ctx, args->blob_id, args->blob_flags, &blob);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
if (blob.type != VIRGL_RESOURCE_FD_INVALID) {
|
|
|
|
ret = virgl_resource_create_from_fd(args->res_handle,
|
|
|
|
blob.type,
|
|
|
|
blob.u.fd,
|
|
|
|
args->iovecs,
|
|
|
|
args->num_iovs);
|
|
|
|
if (ret) {
|
|
|
|
close(blob.u.fd);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
ret = virgl_resource_create_from_pipe(args->res_handle,
|
|
|
|
blob.u.pipe_resource,
|
|
|
|
args->iovecs,
|
|
|
|
args->num_iovs);
|
|
|
|
if (ret) {
|
|
|
|
vrend_renderer_resource_destroy((struct vrend_resource *)blob.u.pipe_resource);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (ctx->get_blob_done)
|
|
|
|
ctx->get_blob_done(ctx, args->res_handle, &blob);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_resource_map(uint32_t res_handle, void **map, uint64_t *out_size)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
return vrend_renderer_resource_map(res->pipe_resource, map, out_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_resource_unmap(uint32_t res_handle)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
return vrend_renderer_resource_unmap(res->pipe_resource);
|
|
|
|
}
|
|
|
|
|
|
|
|
int virgl_renderer_resource_get_map_info(uint32_t res_handle, uint32_t *map_info)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_handle);
|
|
|
|
if (!res || !res->pipe_resource)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
return vrend_renderer_resource_get_map_info(res->pipe_resource, map_info);
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
virgl_renderer_resource_export_blob(uint32_t res_id, uint32_t *fd_type, int *fd)
|
|
|
|
{
|
|
|
|
struct virgl_resource *res = virgl_resource_lookup(res_id);
|
|
|
|
if (!res)
|
|
|
|
return EINVAL;
|
|
|
|
|
|
|
|
switch (virgl_resource_export_fd(res, fd)) {
|
|
|
|
case VIRGL_RESOURCE_FD_DMABUF:
|
|
|
|
*fd_type = VIRGL_RENDERER_BLOB_FD_TYPE_DMABUF;
|
|
|
|
break;
|
|
|
|
case VIRGL_RESOURCE_FD_OPAQUE:
|
|
|
|
*fd_type = VIRGL_RENDERER_BLOB_FD_TYPE_OPAQUE;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|