1#ifndef __NV50_CONTEXT_H__ 2#define __NV50_CONTEXT_H__ 3 4#include "pipe/p_context.h" 5#include "pipe/p_defines.h" 6#include "pipe/p_state.h" 7 8#include "util/u_memory.h" 9#include "util/u_math.h" 10#include "util/u_inlines.h" 11#include "util/u_dynarray.h" 12 13#include "nv50/nv50_winsys.h" 14#include "nv50/nv50_stateobj.h" 15#include "nv50/nv50_screen.h" 16#include "nv50/nv50_program.h" 17#include "nv50/nv50_resource.h" 18#include "nv50/nv50_transfer.h" 19#include "nv50/nv50_query.h" 20 21#include "nouveau_context.h" 22#include "nouveau_debug.h" 23#include "nv_object.xml.h" 24#include "nv_m2mf.xml.h" 25#include "nv50/nv50_3ddefs.xml.h" 26#include "nv50/nv50_3d.xml.h" 27#include "nv50/nv50_2d.xml.h" 28#include "nv50/nv50_compute.xml.h" 29 30// NOTE: the VS/GS/FS order is based on how command methods are laid out for 31// TSC/TIC setting. 32#define NV50_SHADER_STAGE_VERTEX 0 33#define NV50_SHADER_STAGE_GEOMETRY 1 34#define NV50_SHADER_STAGE_FRAGMENT 2 35#define NV50_SHADER_STAGE_COMPUTE 3 36#define NV50_MAX_SHADER_STAGES 4 37 38#define NV50_MAX_3D_SHADER_STAGES 3 39 40#define NV50_NEW_3D_BLEND (1 << 0) 41#define NV50_NEW_3D_RASTERIZER (1 << 1) 42#define NV50_NEW_3D_ZSA (1 << 2) 43#define NV50_NEW_3D_VERTPROG (1 << 3) 44#define NV50_NEW_3D_GMTYPROG (1 << 6) 45#define NV50_NEW_3D_FRAGPROG (1 << 7) 46#define NV50_NEW_3D_BLEND_COLOUR (1 << 8) 47#define NV50_NEW_3D_STENCIL_REF (1 << 9) 48#define NV50_NEW_3D_CLIP (1 << 10) 49#define NV50_NEW_3D_SAMPLE_MASK (1 << 11) 50#define NV50_NEW_3D_FRAMEBUFFER (1 << 12) 51#define NV50_NEW_3D_STIPPLE (1 << 13) 52#define NV50_NEW_3D_SCISSOR (1 << 14) 53#define NV50_NEW_3D_VIEWPORT (1 << 15) 54#define NV50_NEW_3D_ARRAYS (1 << 16) 55#define NV50_NEW_3D_VERTEX (1 << 17) 56#define NV50_NEW_3D_CONSTBUF (1 << 18) 57#define NV50_NEW_3D_TEXTURES (1 << 19) 58#define NV50_NEW_3D_SAMPLERS (1 << 20) 59#define NV50_NEW_3D_STRMOUT (1 << 21) 60#define NV50_NEW_3D_MIN_SAMPLES (1 << 22) 61#define NV50_NEW_3D_WINDOW_RECTS (1 << 23) 62 63#define NV50_NEW_CP_PROGRAM (1 << 0) 64#define NV50_NEW_CP_SURFACES (1 << 1) 65#define NV50_NEW_CP_TEXTURES (1 << 2) 66#define NV50_NEW_CP_SAMPLERS (1 << 3) 67#define NV50_NEW_CP_CONSTBUF (1 << 4) 68#define NV50_NEW_CP_GLOBALS (1 << 5) 69#define NV50_NEW_CP_DRIVERCONST (1 << 6) 70#define NV50_NEW_CP_BUFFERS (1 << 7) 71 72/* 3d bufctx (during draw_vbo, blit_3d) */ 73#define NV50_BIND_3D_FB 0 74#define NV50_BIND_3D_VERTEX 1 75#define NV50_BIND_3D_VERTEX_TMP 2 76#define NV50_BIND_3D_INDEX 3 77#define NV50_BIND_3D_TEXTURES 4 78#define NV50_BIND_3D_CB(s, i) (5 + 16 * (s) + (i)) 79#define NV50_BIND_3D_SO 53 80#define NV50_BIND_3D_SCREEN 54 81#define NV50_BIND_3D_TLS 55 82#define NV50_BIND_3D_COUNT 56 83 84/* compute bufctx (during launch_grid) */ 85#define NV50_BIND_CP_CB(i) ( 0 + (i)) 86#define NV50_BIND_CP_TEXTURES 16 87#define NV50_BIND_CP_SUF 17 88#define NV50_BIND_CP_BUF 18 89#define NV50_BIND_CP_GLOBAL 19 90#define NV50_BIND_CP_SCREEN 20 91#define NV50_BIND_CP_QUERY 21 92#define NV50_BIND_CP_COUNT 22 93 94/* bufctx for other operations */ 95#define NV50_BIND_2D 0 96#define NV50_BIND_M2MF 0 97#define NV50_BIND_FENCE 1 98 99/* fixed constant buffer binding points - low indices for user's constbufs */ 100#define NV50_CB_PVP 123 101#define NV50_CB_PGP 124 102#define NV50_CB_PFP 125 103#define NV50_CB_PCP 126 104/* constant buffer permanently mapped in as c15[] */ 105#define NV50_CB_AUX 127 106/* size of the buffer: 64k. not all taken up, can be reduced if needed. */ 107#define NV50_CB_AUX_SIZE (1 << 16) 108/* 8 user clip planes, at 4 32-bit floats each */ 109#define NV50_CB_AUX_UCP_OFFSET 0x0000 110#define NV50_CB_AUX_UCP_SIZE (8 * 4 * 4) 111/* 16 textures * NV50_MAX_SHADER_STAGES shaders, each with ms_x, ms_y u32 pairs */ 112#define NV50_CB_AUX_TEX_MS_OFFSET 0x0080 113#define NV50_CB_AUX_TEX_MS_SIZE (16 * NV50_MAX_SHADER_STAGES * 2 * 4) 114/* For each MS level (4), 8 sets of 32-bit integer pairs sample offsets */ 115#define NV50_CB_AUX_MS_OFFSET 0x280 116#define NV50_CB_AUX_MS_SIZE (4 * 8 * 4 * 2) 117/* Sample position pairs for the current output MS level */ 118#define NV50_CB_AUX_SAMPLE_OFFSET 0x380 119#define NV50_CB_AUX_SAMPLE_OFFSET_SIZE (4 * 8 * 2) 120/* Alpha test ref value */ 121#define NV50_CB_AUX_ALPHATEST_OFFSET 0x3c0 122#define NV50_CB_AUX_ALPHATEST_SIZE (4) 123/* Compute buffer info: 16 surfaces, 12 32-bit integers each */ 124#define NV50_CB_AUX_BUF_INFO(i) (0x3c4 + (i) * 12 * 4) 125#define NV50_CB_AUX_BUF_SIZE (NV50_MAX_GLOBALS * 12 * 4) 126/* Compute membar mapped area */ 127#define NV50_CB_AUX_MEMBAR_OFFSET 0x6c4 128/* next spot: 0x6c8 */ 129/* 0x800 from the end for compute shader membars, reads only. */ 130#define NV50_CB_AUX_MEMBAR (NV50_CB_AUX_SIZE - 0x800) 131/* 4 32-bit floats for the vertex runout, put at the end */ 132#define NV50_CB_AUX_RUNOUT_OFFSET (NV50_CB_AUX_SIZE - 0x10) 133 134 135 136struct nv50_blitctx; 137 138bool nv50_blitctx_create(struct nv50_context *); 139 140struct nv50_context { 141 struct nouveau_context base; 142 143 struct nv50_screen *screen; 144 145 struct nouveau_bufctx *bufctx_3d; 146 struct nouveau_bufctx *bufctx; 147 struct nouveau_bufctx *bufctx_cp; 148 149 uint32_t dirty_3d; /* dirty flags for 3d state */ 150 uint32_t dirty_cp; /* dirty flags for compute state */ 151 bool cb_dirty; 152 153 struct nv50_graph_state state; 154 155 struct nv50_blend_stateobj *blend; 156 struct nv50_rasterizer_stateobj *rast; 157 struct nv50_zsa_stateobj *zsa; 158 struct nv50_vertex_stateobj *vertex; 159 160 struct nv50_program *vertprog; 161 struct nv50_program *gmtyprog; 162 struct nv50_program *fragprog; 163 struct nv50_program *compprog; 164 165 struct nv50_constbuf constbuf[NV50_MAX_SHADER_STAGES][NV50_MAX_PIPE_CONSTBUFS]; 166 uint16_t constbuf_dirty[NV50_MAX_SHADER_STAGES]; 167 uint16_t constbuf_valid[NV50_MAX_SHADER_STAGES]; 168 uint16_t constbuf_coherent[NV50_MAX_SHADER_STAGES]; 169 170 struct pipe_vertex_buffer vtxbuf[PIPE_MAX_ATTRIBS]; 171 unsigned num_vtxbufs; 172 uint32_t vtxbufs_coherent; 173 uint32_t vbo_fifo; /* bitmask of vertex elements to be pushed to FIFO */ 174 uint32_t vbo_user; /* bitmask of vertex buffers pointing to user memory */ 175 uint32_t vbo_constant; /* bitmask of user buffers with stride 0 */ 176 uint32_t vb_elt_first; /* from pipe_draw_info, for vertex upload */ 177 uint32_t vb_elt_limit; /* max - min element (count - 1) */ 178 uint32_t instance_off; /* base vertex for instanced arrays */ 179 uint32_t instance_max; /* max instance for current draw call */ 180 181 struct pipe_sampler_view *textures[NV50_MAX_SHADER_STAGES][PIPE_MAX_SAMPLERS]; 182 unsigned num_textures[NV50_MAX_SHADER_STAGES]; 183 uint32_t textures_coherent[NV50_MAX_SHADER_STAGES]; 184 struct nv50_tsc_entry *samplers[NV50_MAX_SHADER_STAGES][PIPE_MAX_SAMPLERS]; 185 unsigned num_samplers[NV50_MAX_SHADER_STAGES]; 186 bool seamless_cube_map; 187 188 uint8_t num_so_targets; 189 uint8_t so_targets_dirty; 190 struct pipe_stream_output_target *so_target[4]; 191 /* keeps track of how much of an SO is used. normally this doesn't work in 192 * the presence of GS, but this only needs to work for ES 3.0 which doesn't 193 * have GS or any other oddities. only used pre-NVA0. 194 */ 195 uint32_t so_used[4]; 196 197 struct pipe_framebuffer_state framebuffer; 198 struct pipe_blend_color blend_colour; 199 struct pipe_stencil_ref stencil_ref; 200 struct pipe_poly_stipple stipple; 201 struct pipe_scissor_state scissors[NV50_MAX_VIEWPORTS]; 202 unsigned scissors_dirty; 203 struct pipe_viewport_state viewports[NV50_MAX_VIEWPORTS]; 204 unsigned viewports_dirty; 205 struct pipe_clip_state clip; 206 struct nv50_window_rect_stateobj window_rect; 207 208 unsigned sample_mask; 209 unsigned min_samples; 210 211 bool vbo_push_hint; 212 213 uint32_t rt_array_mode; 214 215 struct pipe_query *cond_query; 216 bool cond_cond; /* inverted rendering condition */ 217 uint cond_mode; 218 uint32_t cond_condmode; /* the calculated condition */ 219 220 struct nv50_blitctx *blit; 221 222 /* compute stage only */ 223 struct pipe_shader_buffer buffers[NV50_MAX_GLOBALS]; 224 uint16_t buffers_dirty; 225 uint16_t buffers_valid; 226 227 struct pipe_image_view images[NV50_MAX_GLOBALS]; 228 uint16_t images_dirty; 229 uint16_t images_valid; 230 231 struct util_dynarray global_residents; 232 233 uint64_t compute_invocations; 234}; 235 236static inline struct nv50_context * 237nv50_context(struct pipe_context *pipe) 238{ 239 return (struct nv50_context *)pipe; 240} 241 242/* return index used in nv50_context arrays for a specific shader type */ 243static inline unsigned 244nv50_context_shader_stage(unsigned pipe) 245{ 246 switch (pipe) { 247 case PIPE_SHADER_VERTEX: return NV50_SHADER_STAGE_VERTEX; 248 case PIPE_SHADER_FRAGMENT: return NV50_SHADER_STAGE_FRAGMENT; 249 case PIPE_SHADER_GEOMETRY: return NV50_SHADER_STAGE_GEOMETRY; 250 case PIPE_SHADER_COMPUTE: return NV50_SHADER_STAGE_COMPUTE; 251 default: 252 assert(!"invalid/unhandled shader type"); 253 return 0; 254 } 255} 256 257/* nv50_context.c */ 258struct pipe_context *nv50_create(struct pipe_screen *, void *, unsigned flags); 259 260void nv50_bufctx_fence(struct nouveau_bufctx *, bool on_flush); 261 262void nv50_default_kick_notify(struct nouveau_pushbuf *); 263 264/* nv50_draw.c */ 265extern struct draw_stage *nv50_draw_render_stage(struct nv50_context *); 266 267/* nv50_shader_state.c */ 268void nv50_vertprog_validate(struct nv50_context *); 269void nv50_gmtyprog_validate(struct nv50_context *); 270void nv50_fragprog_validate(struct nv50_context *); 271void nv50_compprog_validate(struct nv50_context *); 272void nv50_fp_linkage_validate(struct nv50_context *); 273void nv50_gp_linkage_validate(struct nv50_context *); 274void nv50_constbufs_validate(struct nv50_context *); 275void nv50_validate_derived_rs(struct nv50_context *); 276void nv50_stream_output_validate(struct nv50_context *); 277 278/* nv50_state.c */ 279extern void nv50_init_state_functions(struct nv50_context *); 280 281/* nv50_state_validate.c */ 282struct nv50_state_validate { 283 void (*func)(struct nv50_context *); 284 uint32_t states; 285}; 286 287bool nv50_state_validate(struct nv50_context *, uint32_t, 288 struct nv50_state_validate *, int, uint32_t *, 289 struct nouveau_bufctx *); 290bool nv50_state_validate_3d(struct nv50_context *, uint32_t); 291 292/* nv50_surface.c */ 293extern void nv50_clear(struct pipe_context *, unsigned buffers, 294 const struct pipe_scissor_state *scissor_state, 295 const union pipe_color_union *color, 296 double depth, unsigned stencil); 297extern void nv50_init_surface_functions(struct nv50_context *); 298 299/* nv50_tex.c */ 300bool nv50_validate_tic(struct nv50_context *nv50, int s); 301void nv50_validate_textures(struct nv50_context *); 302bool nv50_validate_tsc(struct nv50_context *nv50, int s); 303void nv50_validate_samplers(struct nv50_context *); 304void nv50_upload_ms_info(struct nouveau_pushbuf *); 305void nv50_upload_tsc0(struct nv50_context *); 306 307struct pipe_sampler_view * 308nv50_create_texture_view(struct pipe_context *, 309 struct pipe_resource *, 310 const struct pipe_sampler_view *, 311 uint32_t flags); 312struct pipe_sampler_view * 313nv50_create_sampler_view(struct pipe_context *, 314 struct pipe_resource *, 315 const struct pipe_sampler_view *); 316 317/* nv50_transfer.c */ 318void 319nv50_m2mf_transfer_rect(struct nv50_context *, 320 const struct nv50_m2mf_rect *dst, 321 const struct nv50_m2mf_rect *src, 322 uint32_t nblocksx, uint32_t nblocksy); 323void 324nv50_sifc_linear_u8(struct nouveau_context *pipe, 325 struct nouveau_bo *dst, unsigned offset, unsigned domain, 326 unsigned size, const void *data); 327void 328nv50_m2mf_copy_linear(struct nouveau_context *pipe, 329 struct nouveau_bo *dst, unsigned dstoff, unsigned dstdom, 330 struct nouveau_bo *src, unsigned srcoff, unsigned srcdom, 331 unsigned size); 332void 333nv50_cb_push(struct nouveau_context *nv, 334 struct nv04_resource *res, 335 unsigned offset, unsigned words, const uint32_t *data); 336 337/* nv50_vbo.c */ 338void nv50_draw_vbo(struct pipe_context *, const struct pipe_draw_info *, unsigned, 339 const struct pipe_draw_indirect_info *indirect, 340 const struct pipe_draw_start_count_bias *draws, 341 unsigned num_draws); 342 343void * 344nv50_vertex_state_create(struct pipe_context *pipe, 345 unsigned num_elements, 346 const struct pipe_vertex_element *elements); 347void 348nv50_vertex_state_delete(struct pipe_context *pipe, void *hwcso); 349 350void nv50_vertex_arrays_validate(struct nv50_context *nv50); 351 352/* nv50_push.c */ 353void nv50_push_vbo(struct nv50_context *, const struct pipe_draw_info *, 354 const struct pipe_draw_indirect_info *indirect, 355 const struct pipe_draw_start_count_bias *draw); 356 357/* nv84_video.c */ 358struct pipe_video_codec * 359nv84_create_decoder(struct pipe_context *context, 360 const struct pipe_video_codec *templ); 361 362struct pipe_video_buffer * 363nv84_video_buffer_create(struct pipe_context *pipe, 364 const struct pipe_video_buffer *template); 365 366int 367nv84_screen_get_video_param(struct pipe_screen *pscreen, 368 enum pipe_video_profile profile, 369 enum pipe_video_entrypoint entrypoint, 370 enum pipe_video_cap param); 371 372bool 373nv84_screen_video_supported(struct pipe_screen *screen, 374 enum pipe_format format, 375 enum pipe_video_profile profile, 376 enum pipe_video_entrypoint entrypoint); 377 378/* nv98_video.c */ 379struct pipe_video_codec * 380nv98_create_decoder(struct pipe_context *context, 381 const struct pipe_video_codec *templ); 382 383struct pipe_video_buffer * 384nv98_video_buffer_create(struct pipe_context *pipe, 385 const struct pipe_video_buffer *template); 386 387/* nv50_compute.c */ 388void 389nv50_launch_grid(struct pipe_context *, const struct pipe_grid_info *); 390 391#endif 392