|
|
|
/**************************************************************************
|
|
|
|
*
|
|
|
|
* Copyright (C) 2014 Red Hat Inc.
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
|
|
* to deal in the Software without restriction, including without limitation
|
|
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included
|
|
|
|
* in all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
|
|
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
|
|
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
|
|
* OTHER DEALINGS IN THE SOFTWARE.
|
|
|
|
*
|
|
|
|
**************************************************************************/
|
|
|
|
|
|
|
|
#ifndef VREND_RENDERER_H
|
|
|
|
#define VREND_RENDERER_H
|
|
|
|
|
|
|
|
#include "pipe/p_state.h"
|
|
|
|
#include "util/u_double_list.h"
|
|
|
|
#include "util/u_inlines.h"
|
|
|
|
#include "virgl_protocol.h"
|
|
|
|
#include "vrend_debug.h"
|
|
|
|
#include "vrend_tweaks.h"
|
|
|
|
#include "vrend_iov.h"
|
|
|
|
#include "vrend_winsys_gbm.h"
|
|
|
|
#include "virgl_hw.h"
|
|
|
|
#include <epoxy/gl.h>
|
|
|
|
|
|
|
|
typedef void *virgl_gl_context;
|
|
|
|
typedef void *virgl_gl_drawable;
|
|
|
|
|
|
|
|
struct virgl_gl_ctx_param {
|
|
|
|
int major_ver;
|
|
|
|
int minor_ver;
|
|
|
|
bool shared;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct virgl_context;
|
|
|
|
struct vrend_context;
|
|
|
|
|
|
|
|
/* Number of mipmap levels for which to keep the backing iov offsets.
|
|
|
|
* Value mirrored from mesa/virgl
|
|
|
|
*/
|
|
|
|
#define VR_MAX_TEXTURE_2D_LEVELS 15
|
|
|
|
|
|
|
|
#define VREND_STORAGE_GUEST_MEMORY BIT(0)
|
|
|
|
#define VREND_STORAGE_GL_TEXTURE BIT(1)
|
|
|
|
#define VREND_STORAGE_GL_BUFFER BIT(2)
|
|
|
|
#define VREND_STORAGE_EGL_IMAGE BIT(3)
|
|
|
|
#define VREND_STORAGE_GBM_BUFFER BIT(4)
|
|
|
|
#define VREND_STORAGE_HOST_SYSTEM_MEMORY BIT(5)
|
|
|
|
#define VREND_STORAGE_GL_IMMUTABLE BIT(6)
|
|
|
|
#define VREND_STORAGE_GL_MEMOBJ BIT(7)
|
|
|
|
|
|
|
|
struct vrend_resource {
|
|
|
|
struct pipe_resource base;
|
|
|
|
uint32_t storage_bits;
|
|
|
|
uint32_t map_info;
|
|
|
|
|
|
|
|
GLuint id;
|
|
|
|
GLenum target;
|
|
|
|
|
|
|
|
/* fb id if we need to readback this resource */
|
|
|
|
GLuint readback_fb_id;
|
|
|
|
GLuint readback_fb_level;
|
|
|
|
GLuint readback_fb_z;
|
|
|
|
|
|
|
|
GLuint tbo_tex_id;/* tbos have two ids to track */
|
|
|
|
bool y_0_top;
|
|
|
|
|
|
|
|
/* Pointer to system memory storage for this resource. Only valid for
|
|
|
|
* VREND_RESOURCE_STORAGE_GUEST_ELSE_SYSTEM buffer storage.
|
|
|
|
*/
|
|
|
|
char *ptr;
|
|
|
|
/* IOV pointing to shared guest memory storage for this resource. */
|
|
|
|
const struct iovec *iov;
|
|
|
|
uint32_t num_iovs;
|
|
|
|
uint64_t mipmap_offsets[VR_MAX_TEXTURE_2D_LEVELS];
|
|
|
|
void *gbm_bo, *egl_image;
|
|
|
|
void *aux_plane_egl_image[VIRGL_GBM_MAX_PLANES];
|
|
|
|
|
|
|
|
uint64_t size;
|
|
|
|
GLbitfield buffer_storage_flags;
|
|
|
|
GLuint memobj;
|
|
|
|
|
|
|
|
uint32_t blob_id;
|
|
|
|
struct list_head head;
|
|
|
|
};
|
|
|
|
|
|
|
|
#define VIRGL_TEXTURE_NEED_SWIZZLE (1 << 0)
|
|
|
|
#define VIRGL_TEXTURE_CAN_TEXTURE_STORAGE (1 << 1)
|
|
|
|
#define VIRGL_TEXTURE_CAN_READBACK (1 << 2)
|
|
|
|
|
|
|
|
struct vrend_format_table {
|
|
|
|
enum virgl_formats format;
|
|
|
|
GLenum internalformat;
|
|
|
|
GLenum glformat;
|
|
|
|
GLenum gltype;
|
|
|
|
uint8_t swizzle[4];
|
|
|
|
uint32_t bindings;
|
|
|
|
uint32_t flags;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct vrend_if_cbs {
|
|
|
|
void (*write_fence)(unsigned fence_id);
|
|
|
|
|
|
|
|
virgl_gl_context (*create_gl_context)(int scanout, struct virgl_gl_ctx_param *params);
|
|
|
|
void (*destroy_gl_context)(virgl_gl_context ctx);
|
|
|
|
int (*make_current)(virgl_gl_context ctx);
|
|
|
|
};
|
renderer: use a thread to block for fences.
Instead of polling the fences regularly, have a thread
that blocks for a single fence using a separate shared
context, then uses eventfd to wake up the main thread
when something happens.
Inside the guest, glmark2 typicially runs twice as fast with the thread
sync. Although in general, the performances seems to be about +30%. The
benefits is mostly for CPU-bounds tasks (when main the thread hits 100%)
A naive perf stat of the vtest renderer with glmark2 "build" test with a
fixed number of frames (500) results in the following stats data:
(do not value timing related informations, since the renderer is ran and
stopped manually)
without thread:
3032.282265 task-clock (msec) # 0.420 CPUs utilized
4,277 context-switches # 0.001 M/sec
102 cpu-migrations # 0.034 K/sec
9,020 page-faults # 0.003 M/sec
7,884,098,254 cycles # 2.600 GHz
4,440,126,451 stalled-cycles-frontend # 56.32% frontend cycles idle
<not supported> stalled-cycles-backend
11,024,091,578 instructions # 1.40 insns per cycle
# 0.40 stalled
# cycles per insn
1,091,831,588 branches # 360.069 M/sec
5,426,846 branch-misses # 0.50% of all branches
with thread:
3403.592921 task-clock (msec) # 0.452 CPUs utilized
7,145 context-switches # 0.002 M/sec
410 cpu-migrations # 0.120 K/sec
6,191 page-faults # 0.002 M/sec
7,475,038,064 cycles # 2.196 GHz
4,487,043,071 stalled-cycles-frontend # 60.03% frontend cycles idle
<not supported> stalled-cycles-backend
9,925,205,494 instructions # 1.33 insns per cycle
# 0.45 stalled
# cycles per insn
834,375,503 branches # 245.146 M/sec
4,919,995 branch-misses # 0.59% of all branches
Signed-off-by: Marc-André Lureau <marcandre.lureau@gmail.com>
Signed-off-by: Dave Airlie <airlied@redhat.com>
9 years ago
|
|
|
|
|
|
|
#define VREND_USE_THREAD_SYNC 1
|
|
|
|
#define VREND_USE_EXTERNAL_BLOB 2
|
renderer: use a thread to block for fences.
Instead of polling the fences regularly, have a thread
that blocks for a single fence using a separate shared
context, then uses eventfd to wake up the main thread
when something happens.
Inside the guest, glmark2 typicially runs twice as fast with the thread
sync. Although in general, the performances seems to be about +30%. The
benefits is mostly for CPU-bounds tasks (when main the thread hits 100%)
A naive perf stat of the vtest renderer with glmark2 "build" test with a
fixed number of frames (500) results in the following stats data:
(do not value timing related informations, since the renderer is ran and
stopped manually)
without thread:
3032.282265 task-clock (msec) # 0.420 CPUs utilized
4,277 context-switches # 0.001 M/sec
102 cpu-migrations # 0.034 K/sec
9,020 page-faults # 0.003 M/sec
7,884,098,254 cycles # 2.600 GHz
4,440,126,451 stalled-cycles-frontend # 56.32% frontend cycles idle
<not supported> stalled-cycles-backend
11,024,091,578 instructions # 1.40 insns per cycle
# 0.40 stalled
# cycles per insn
1,091,831,588 branches # 360.069 M/sec
5,426,846 branch-misses # 0.50% of all branches
with thread:
3403.592921 task-clock (msec) # 0.452 CPUs utilized
7,145 context-switches # 0.002 M/sec
410 cpu-migrations # 0.120 K/sec
6,191 page-faults # 0.002 M/sec
7,475,038,064 cycles # 2.196 GHz
4,487,043,071 stalled-cycles-frontend # 60.03% frontend cycles idle
<not supported> stalled-cycles-backend
9,925,205,494 instructions # 1.33 insns per cycle
# 0.45 stalled
# cycles per insn
834,375,503 branches # 245.146 M/sec
4,919,995 branch-misses # 0.59% of all branches
Signed-off-by: Marc-André Lureau <marcandre.lureau@gmail.com>
Signed-off-by: Dave Airlie <airlied@redhat.com>
9 years ago
|
|
|
|
|
|
|
const struct virgl_resource_pipe_callbacks *
|
|
|
|
vrend_renderer_get_pipe_callbacks(void);
|
|
|
|
|
|
|
|
int vrend_renderer_init(const struct vrend_if_cbs *cbs, uint32_t flags);
|
|
|
|
|
|
|
|
void vrend_insert_format(struct vrend_format_table *entry, uint32_t bindings, uint32_t flags);
|
|
|
|
bool vrend_check_framebuffer_mixed_color_attachements(void);
|
|
|
|
|
|
|
|
void vrend_insert_format_swizzle(int override_format, struct vrend_format_table *entry,
|
|
|
|
uint32_t bindings, uint8_t swizzle[4], uint32_t flags);
|
|
|
|
const struct vrend_format_table *vrend_get_format_table_entry(enum virgl_formats format);
|
|
|
|
const struct vrend_format_table *vrend_get_format_table_entry_with_emulation(uint32_t bind, enum virgl_formats format);
|
|
|
|
|
|
|
|
int vrend_create_shader(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
const struct pipe_stream_output_info *stream_output,
|
|
|
|
uint32_t req_local_mem,
|
|
|
|
const char *shd_text, uint32_t offlen, uint32_t num_tokens,
|
|
|
|
uint32_t type, uint32_t pkt_length);
|
|
|
|
|
|
|
|
void vrend_bind_shader(struct vrend_context *ctx,
|
|
|
|
uint32_t type,
|
|
|
|
uint32_t handle);
|
|
|
|
|
|
|
|
void vrend_bind_vs_so(struct vrend_context *ctx,
|
|
|
|
uint32_t handle);
|
|
|
|
void vrend_clear(struct vrend_context *ctx,
|
|
|
|
unsigned buffers,
|
|
|
|
const union pipe_color_union *color,
|
|
|
|
double depth, unsigned stencil);
|
|
|
|
|
|
|
|
void vrend_clear_texture(struct vrend_context* ctx,
|
|
|
|
uint32_t handle, uint32_t level,
|
|
|
|
const struct pipe_box *box,
|
|
|
|
const void * data);
|
|
|
|
|
|
|
|
int vrend_draw_vbo(struct vrend_context *ctx,
|
|
|
|
const struct pipe_draw_info *info,
|
|
|
|
uint32_t cso, uint32_t indirect_handle, uint32_t indirect_draw_count_handle);
|
|
|
|
|
|
|
|
void vrend_set_framebuffer_state(struct vrend_context *ctx,
|
|
|
|
uint32_t nr_cbufs, uint32_t surf_handle[PIPE_MAX_COLOR_BUFS],
|
|
|
|
uint32_t zsurf_handle);
|
|
|
|
|
|
|
|
struct vrend_context *vrend_create_context(int id, uint32_t nlen, const char *debug_name);
|
|
|
|
void vrend_destroy_context(struct vrend_context *ctx);
|
|
|
|
struct virgl_context *vrend_renderer_context_create(uint32_t handle,
|
|
|
|
uint32_t nlen,
|
|
|
|
const char *name);
|
|
|
|
|
|
|
|
struct vrend_renderer_resource_create_args {
|
|
|
|
enum pipe_texture_target target;
|
|
|
|
uint32_t format;
|
|
|
|
uint32_t bind;
|
|
|
|
uint32_t width;
|
|
|
|
uint32_t height;
|
|
|
|
uint32_t depth;
|
|
|
|
uint32_t array_size;
|
|
|
|
uint32_t last_level;
|
|
|
|
uint32_t nr_samples;
|
|
|
|
uint32_t flags;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct pipe_resource *
|
|
|
|
vrend_renderer_resource_create(const struct vrend_renderer_resource_create_args *args,
|
|
|
|
void *image_eos);
|
|
|
|
|
|
|
|
int vrend_create_surface(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
uint32_t res_handle, uint32_t format,
|
|
|
|
uint32_t val0, uint32_t val1);
|
|
|
|
int vrend_create_sampler_view(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
uint32_t res_handle, uint32_t format,
|
|
|
|
uint32_t val0, uint32_t val1, uint32_t swizzle_packed);
|
|
|
|
|
|
|
|
int vrend_create_sampler_state(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
struct pipe_sampler_state *templ);
|
|
|
|
|
|
|
|
int vrend_create_so_target(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
uint32_t res_handle,
|
|
|
|
uint32_t buffer_offset,
|
|
|
|
uint32_t buffer_size);
|
|
|
|
|
|
|
|
void vrend_set_streamout_targets(struct vrend_context *ctx,
|
|
|
|
uint32_t append_bitmask,
|
|
|
|
uint32_t num_targets,
|
|
|
|
uint32_t *handles);
|
|
|
|
|
|
|
|
int vrend_create_vertex_elements_state(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
unsigned num_elements,
|
|
|
|
const struct pipe_vertex_element *elements);
|
|
|
|
void vrend_bind_vertex_elements_state(struct vrend_context *ctx,
|
|
|
|
uint32_t handle);
|
|
|
|
|
|
|
|
void vrend_set_single_vbo(struct vrend_context *ctx,
|
|
|
|
uint32_t index,
|
|
|
|
uint32_t stride,
|
|
|
|
uint32_t buffer_offset,
|
|
|
|
uint32_t res_handle);
|
|
|
|
void vrend_set_num_vbo(struct vrend_context *ctx,
|
|
|
|
int num_vbo);
|
|
|
|
|
|
|
|
int vrend_transfer_inline_write(struct vrend_context *ctx,
|
|
|
|
uint32_t dst_handle,
|
|
|
|
const struct vrend_transfer_info *info);
|
|
|
|
|
|
|
|
int vrend_renderer_copy_transfer3d(struct vrend_context *ctx,
|
|
|
|
uint32_t dst_handle,
|
|
|
|
uint32_t src_handle,
|
|
|
|
const struct vrend_transfer_info *info);
|
|
|
|
|
|
|
|
void vrend_set_viewport_states(struct vrend_context *ctx,
|
|
|
|
uint32_t start_slot, uint32_t num_viewports,
|
|
|
|
const struct pipe_viewport_state *state);
|
|
|
|
void vrend_set_num_sampler_views(struct vrend_context *ctx,
|
|
|
|
uint32_t shader_type,
|
|
|
|
uint32_t start_slot,
|
|
|
|
uint32_t num_sampler_views);
|
|
|
|
void vrend_set_single_sampler_view(struct vrend_context *ctx,
|
|
|
|
uint32_t shader_type,
|
|
|
|
uint32_t index,
|
|
|
|
uint32_t res_handle);
|
|
|
|
|
|
|
|
void vrend_object_bind_blend(struct vrend_context *ctx,
|
|
|
|
uint32_t handle);
|
|
|
|
void vrend_object_bind_dsa(struct vrend_context *ctx,
|
|
|
|
uint32_t handle);
|
|
|
|
void vrend_object_bind_rasterizer(struct vrend_context *ctx,
|
|
|
|
uint32_t handle);
|
|
|
|
|
|
|
|
void vrend_bind_sampler_states(struct vrend_context *ctx,
|
|
|
|
uint32_t shader_type,
|
|
|
|
uint32_t start_slot,
|
|
|
|
uint32_t num_states,
|
|
|
|
const uint32_t *handles);
|
|
|
|
void vrend_set_index_buffer(struct vrend_context *ctx,
|
|
|
|
uint32_t res_handle,
|
|
|
|
uint32_t index_size,
|
|
|
|
uint32_t offset);
|
|
|
|
void vrend_set_single_image_view(struct vrend_context *ctx,
|
|
|
|
uint32_t shader_type,
|
|
|
|
uint32_t index,
|
|
|
|
uint32_t format, uint32_t access,
|
|
|
|
uint32_t layer_offset, uint32_t level_size,
|
|
|
|
uint32_t handle);
|
|
|
|
void vrend_set_single_ssbo(struct vrend_context *ctx,
|
|
|
|
uint32_t shader_type,
|
|
|
|
uint32_t index,
|
|
|
|
uint32_t offset, uint32_t length,
|
|
|
|
uint32_t handle);
|
|
|
|
void vrend_set_single_abo(struct vrend_context *ctx,
|
|
|
|
uint32_t index,
|
|
|
|
uint32_t offset, uint32_t length,
|
|
|
|
uint32_t handle);
|
|
|
|
void vrend_memory_barrier(struct vrend_context *ctx,
|
|
|
|
unsigned flags);
|
|
|
|
void vrend_launch_grid(struct vrend_context *ctx,
|
|
|
|
uint32_t *block,
|
|
|
|
uint32_t *grid,
|
|
|
|
uint32_t indirect_handle,
|
|
|
|
uint32_t indirect_offset);
|
|
|
|
void vrend_set_framebuffer_state_no_attach(struct vrend_context *ctx,
|
|
|
|
uint32_t width, uint32_t height,
|
|
|
|
uint32_t layers, uint32_t samples);
|
|
|
|
void vrend_texture_barrier(struct vrend_context *ctx,
|
|
|
|
unsigned flags);
|
|
|
|
|
|
|
|
int vrend_renderer_transfer_iov(struct vrend_context *ctx,
|
|
|
|
uint32_t dst_handle,
|
|
|
|
const struct vrend_transfer_info *info,
|
|
|
|
int transfer_mode);
|
|
|
|
|
|
|
|
int vrend_renderer_transfer_pipe(struct pipe_resource *pres,
|
|
|
|
const struct vrend_transfer_info *info,
|
|
|
|
int transfer_mode);
|
|
|
|
|
|
|
|
void vrend_renderer_resource_copy_region(struct vrend_context *ctx,
|
|
|
|
uint32_t dst_handle, uint32_t dst_level,
|
|
|
|
uint32_t dstx, uint32_t dsty, uint32_t dstz,
|
|
|
|
uint32_t src_handle, uint32_t src_level,
|
|
|
|
const struct pipe_box *src_box);
|
|
|
|
|
|
|
|
void vrend_renderer_blit(struct vrend_context *ctx,
|
|
|
|
uint32_t dst_handle, uint32_t src_handle,
|
|
|
|
const struct pipe_blit_info *info);
|
|
|
|
|
|
|
|
void vrend_set_stencil_ref(struct vrend_context *ctx, struct pipe_stencil_ref *ref);
|
|
|
|
void vrend_set_blend_color(struct vrend_context *ctx, struct pipe_blend_color *color);
|
|
|
|
void vrend_set_scissor_state(struct vrend_context *ctx,
|
|
|
|
uint32_t start_slot,
|
|
|
|
uint32_t num_scissor,
|
|
|
|
struct pipe_scissor_state *ss);
|
|
|
|
|
|
|
|
void vrend_set_polygon_stipple(struct vrend_context *ctx, struct pipe_poly_stipple *ps);
|
|
|
|
|
|
|
|
void vrend_set_clip_state(struct vrend_context *ctx, struct pipe_clip_state *ucp);
|
|
|
|
void vrend_set_sample_mask(struct vrend_context *ctx, unsigned sample_mask);
|
|
|
|
void vrend_set_min_samples(struct vrend_context *ctx, unsigned min_samples);
|
|
|
|
|
|
|
|
void vrend_set_constants(struct vrend_context *ctx,
|
|
|
|
uint32_t shader,
|
|
|
|
uint32_t index,
|
|
|
|
uint32_t num_constant,
|
|
|
|
const float *data);
|
|
|
|
|
|
|
|
void vrend_set_uniform_buffer(struct vrend_context *ctx, uint32_t shader,
|
|
|
|
uint32_t index, uint32_t offset, uint32_t length,
|
|
|
|
uint32_t res_handle);
|
|
|
|
|
|
|
|
void vrend_fb_bind_texture_id(struct vrend_resource *res,
|
|
|
|
int id,
|
|
|
|
int idx,
|
|
|
|
uint32_t level, uint32_t layer);
|
|
|
|
|
|
|
|
void vrend_set_tess_state(struct vrend_context *ctx, const float tess_factors[6]);
|
|
|
|
|
|
|
|
void vrend_renderer_fini(void);
|
|
|
|
|
|
|
|
int vrend_renderer_create_fence(int client_fence_id, uint32_t ctx_id);
|
|
|
|
|
|
|
|
void vrend_renderer_check_fences(void);
|
|
|
|
|
|
|
|
int vrend_renderer_export_fence(uint32_t fence_id, int* out_fd);
|
|
|
|
|
|
|
|
bool vrend_hw_switch_context(struct vrend_context *ctx, bool now);
|
|
|
|
uint32_t vrend_renderer_object_insert(struct vrend_context *ctx, void *data,
|
|
|
|
uint32_t handle, enum virgl_object_type type);
|
|
|
|
void vrend_renderer_object_destroy(struct vrend_context *ctx, uint32_t handle);
|
|
|
|
|
|
|
|
int vrend_create_query(struct vrend_context *ctx, uint32_t handle,
|
|
|
|
uint32_t query_type, uint32_t query_index,
|
|
|
|
uint32_t res_handle, uint32_t offset);
|
|
|
|
|
|
|
|
int vrend_begin_query(struct vrend_context *ctx, uint32_t handle);
|
|
|
|
int vrend_end_query(struct vrend_context *ctx, uint32_t handle);
|
|
|
|
void vrend_get_query_result(struct vrend_context *ctx, uint32_t handle,
|
|
|
|
uint32_t wait);
|
|
|
|
void vrend_get_query_result_qbo(struct vrend_context *ctx, uint32_t handle,
|
|
|
|
uint32_t qbo_handle,
|
|
|
|
uint32_t wait, uint32_t result_type, uint32_t offset,
|
|
|
|
int32_t index);
|
|
|
|
void vrend_render_condition(struct vrend_context *ctx,
|
|
|
|
uint32_t handle,
|
|
|
|
bool condtion,
|
|
|
|
uint mode);
|
|
|
|
void *vrend_renderer_get_cursor_contents(struct pipe_resource *pres,
|
|
|
|
uint32_t *width,
|
|
|
|
uint32_t *height);
|
|
|
|
|
|
|
|
void vrend_renderer_fill_caps(uint32_t set, uint32_t version,
|
|
|
|
union virgl_caps *caps);
|
|
|
|
|
|
|
|
GLint64 vrend_renderer_get_timestamp(void);
|
|
|
|
|
|
|
|
void vrend_build_format_list_common(void);
|
|
|
|
void vrend_build_format_list_gl(void);
|
|
|
|
void vrend_build_format_list_gles(void);
|
|
|
|
void vrend_build_emulated_format_list_gles(void);
|
|
|
|
void vrend_check_texture_storage(struct vrend_format_table *table);
|
|
|
|
|
|
|
|
void vrend_renderer_resource_destroy(struct vrend_resource *res);
|
|
|
|
|
|
|
|
static inline void
|
|
|
|
vrend_resource_reference(struct vrend_resource **ptr, struct vrend_resource *tex)
|
|
|
|
{
|
|
|
|
struct vrend_resource *old_tex = *ptr;
|
|
|
|
|
|
|
|
if (pipe_reference(&(*ptr)->base.reference, &tex->base.reference))
|
|
|
|
vrend_renderer_resource_destroy(old_tex);
|
|
|
|
*ptr = tex;
|
|
|
|
}
|
|
|
|
|
|
|
|
void vrend_renderer_force_ctx_0(void);
|
|
|
|
|
|
|
|
void vrend_renderer_get_rect(struct pipe_resource *pres,
|
|
|
|
const struct iovec *iov, unsigned int num_iovs,
|
|
|
|
uint32_t offset,
|
|
|
|
int x, int y, int width, int height);
|
|
|
|
|
|
|
|
void vrend_renderer_attach_res_ctx(struct vrend_context *ctx,
|
|
|
|
uint32_t res_id,
|
|
|
|
struct pipe_resource *pres);
|
|
|
|
void vrend_renderer_detach_res_ctx(struct vrend_context *ctx,
|
|
|
|
uint32_t res_id);
|
|
|
|
|
|
|
|
struct vrend_context_tweaks *vrend_get_context_tweaks(struct vrend_context *ctx);
|
|
|
|
|
|
|
|
struct vrend_renderer_resource_info {
|
|
|
|
uint32_t handle;
|
|
|
|
uint32_t format;
|
|
|
|
uint32_t width;
|
|
|
|
uint32_t height;
|
|
|
|
uint32_t depth;
|
|
|
|
uint32_t flags;
|
|
|
|
uint32_t tex_id;
|
|
|
|
uint32_t stride;
|
|
|
|
};
|
|
|
|
|
|
|
|
void vrend_renderer_resource_get_info(struct pipe_resource *pres,
|
|
|
|
struct vrend_renderer_resource_info *info);
|
|
|
|
|
|
|
|
void vrend_renderer_get_cap_set(uint32_t cap_set, uint32_t *max_ver,
|
|
|
|
uint32_t *max_size);
|
|
|
|
|
|
|
|
void vrend_renderer_create_sub_ctx(struct vrend_context *ctx, int sub_ctx_id);
|
|
|
|
void vrend_renderer_destroy_sub_ctx(struct vrend_context *ctx, int sub_ctx_id);
|
|
|
|
void vrend_renderer_set_sub_ctx(struct vrend_context *ctx, int sub_ctx_id);
|
|
|
|
|
|
|
|
void vrend_report_context_error_internal(const char *fname, struct vrend_context *ctx,
|
|
|
|
enum virgl_ctx_errors error, uint32_t value);
|
|
|
|
|
|
|
|
#define vrend_report_context_error(ctx, error, value) \
|
|
|
|
vrend_report_context_error_internal(__func__, ctx, error, value)
|
|
|
|
|
|
|
|
#define vrend_report_buffer_error(ctx, cmd) \
|
|
|
|
vrend_report_context_error(ctx, VIRGL_ERROR_CTX_ILLEGAL_CMD_BUFFER, cmd)
|
|
|
|
|
|
|
|
void vrend_fb_bind_texture(struct vrend_resource *res,
|
|
|
|
int idx,
|
|
|
|
uint32_t level, uint32_t layer);
|
|
|
|
bool vrend_format_is_emulated_alpha(enum virgl_formats format);
|
|
|
|
boolean format_is_copy_compatible(enum virgl_formats src, enum virgl_formats dst,
|
|
|
|
boolean allow_compressed);
|
|
|
|
|
|
|
|
/* blitter interface */
|
|
|
|
void vrend_renderer_blit_gl(struct vrend_context *ctx,
|
|
|
|
struct vrend_resource *src_res,
|
|
|
|
struct vrend_resource *dst_res,
|
|
|
|
GLenum blit_views[2],
|
|
|
|
const struct pipe_blit_info *info,
|
|
|
|
bool has_texture_srgb_decode,
|
|
|
|
bool has_srgb_write_control,
|
|
|
|
bool skip_dest_swizzle);
|
|
|
|
void vrend_blitter_fini(void);
|
|
|
|
|
|
|
|
void vrend_renderer_prepare_reset(void);
|
|
|
|
void vrend_renderer_reset(void);
|
renderer: use a thread to block for fences.
Instead of polling the fences regularly, have a thread
that blocks for a single fence using a separate shared
context, then uses eventfd to wake up the main thread
when something happens.
Inside the guest, glmark2 typicially runs twice as fast with the thread
sync. Although in general, the performances seems to be about +30%. The
benefits is mostly for CPU-bounds tasks (when main the thread hits 100%)
A naive perf stat of the vtest renderer with glmark2 "build" test with a
fixed number of frames (500) results in the following stats data:
(do not value timing related informations, since the renderer is ran and
stopped manually)
without thread:
3032.282265 task-clock (msec) # 0.420 CPUs utilized
4,277 context-switches # 0.001 M/sec
102 cpu-migrations # 0.034 K/sec
9,020 page-faults # 0.003 M/sec
7,884,098,254 cycles # 2.600 GHz
4,440,126,451 stalled-cycles-frontend # 56.32% frontend cycles idle
<not supported> stalled-cycles-backend
11,024,091,578 instructions # 1.40 insns per cycle
# 0.40 stalled
# cycles per insn
1,091,831,588 branches # 360.069 M/sec
5,426,846 branch-misses # 0.50% of all branches
with thread:
3403.592921 task-clock (msec) # 0.452 CPUs utilized
7,145 context-switches # 0.002 M/sec
410 cpu-migrations # 0.120 K/sec
6,191 page-faults # 0.002 M/sec
7,475,038,064 cycles # 2.196 GHz
4,487,043,071 stalled-cycles-frontend # 60.03% frontend cycles idle
<not supported> stalled-cycles-backend
9,925,205,494 instructions # 1.33 insns per cycle
# 0.45 stalled
# cycles per insn
834,375,503 branches # 245.146 M/sec
4,919,995 branch-misses # 0.59% of all branches
Signed-off-by: Marc-André Lureau <marcandre.lureau@gmail.com>
Signed-off-by: Dave Airlie <airlied@redhat.com>
9 years ago
|
|
|
int vrend_renderer_get_poll_fd(void);
|
|
|
|
|
|
|
|
unsigned vrend_context_has_debug_flag(const struct vrend_context *ctx,
|
|
|
|
enum virgl_debug_flags flag);
|
|
|
|
|
|
|
|
unsigned vrend_renderer_query_multisample_caps(unsigned max_samples,
|
|
|
|
struct virgl_caps_v2 *caps);
|
|
|
|
|
|
|
|
struct gl_version {
|
|
|
|
uint32_t major;
|
|
|
|
uint32_t minor;
|
|
|
|
};
|
|
|
|
|
|
|
|
static const struct gl_version gl_versions[] = { {4,6}, {4,5}, {4,4}, {4,3}, {4,2}, {4,1}, {4,0},
|
|
|
|
{3,3}, {3,2}, {3,1}, {3,0} };
|
|
|
|
|
|
|
|
extern const struct vrend_if_cbs *vrend_clicbs;
|
|
|
|
|
|
|
|
int vrend_renderer_export_query(struct pipe_resource *pres,
|
|
|
|
struct virgl_renderer_export_query *export_query);
|
|
|
|
|
|
|
|
void vrend_sync_make_current(virgl_gl_context);
|
|
|
|
|
|
|
|
int
|
|
|
|
vrend_renderer_pipe_resource_create(struct vrend_context *ctx, uint32_t blob_id,
|
|
|
|
const struct vrend_renderer_resource_create_args *args);
|
|
|
|
|
|
|
|
struct pipe_resource *vrend_get_blob_pipe(struct vrend_context *ctx, uint64_t blob_id);
|
|
|
|
|
|
|
|
int vrend_renderer_resource_get_map_info(struct pipe_resource *pres, uint32_t *map_info);
|
|
|
|
|
|
|
|
int vrend_renderer_resource_map(struct pipe_resource *pres, void **map, uint64_t *out_size);
|
|
|
|
|
|
|
|
int vrend_renderer_resource_unmap(struct pipe_resource *pres);
|
|
|
|
|
|
|
|
#endif
|