2
* Copyright (C) 2016 Rob Clark <robclark@freedesktop.org>
4
* Permission is hereby granted, free of charge, to any person obtaining a
5
* copy of this software and associated documentation files (the "Software"),
6
* to deal in the Software without restriction, including without limitation
7
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
8
* and/or sell copies of the Software, and to permit persons to whom the
9
* Software is furnished to do so, subject to the following conditions:
11
* The above copyright notice and this permission notice (including the next
12
* paragraph) shall be included in all copies or substantial portions of the
15
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24
* Rob Clark <robclark@freedesktop.org>
27
#include "pipe/p_state.h"
28
#include "util/format/u_format.h"
29
#include "util/u_inlines.h"
30
#include "util/u_memory.h"
31
#include "util/u_string.h"
33
#include "freedreno_draw.h"
34
#include "freedreno_resource.h"
35
#include "freedreno_state.h"
37
#include "fd5_context.h"
40
#include "fd5_format.h"
42
#include "fd5_program.h"
46
emit_mrt(struct fd_ringbuffer *ring, unsigned nr_bufs,
47
struct pipe_surface **bufs, const struct fd_gmem_stateobj *gmem)
49
enum a5xx_tile_mode tile_mode;
52
for (i = 0; i < A5XX_MAX_RENDER_TARGETS; i++) {
53
enum a5xx_color_fmt format = 0;
54
enum a3xx_color_swap swap = WZYX;
55
bool srgb = false, sint = false, uint = false;
56
struct fd_resource *rsc = NULL;
65
tile_mode = TILE5_LINEAR;
68
if ((i < nr_bufs) && bufs[i]) {
69
struct pipe_surface *psurf = bufs[i];
70
enum pipe_format pformat = psurf->format;
72
rsc = fd_resource(psurf->texture);
74
format = fd5_pipe2color(pformat);
75
swap = fd5_pipe2swap(pformat);
76
srgb = util_format_is_srgb(pformat);
77
sint = util_format_is_pure_sint(pformat);
78
uint = util_format_is_pure_uint(pformat);
80
debug_assert(psurf->u.tex.first_layer == psurf->u.tex.last_layer);
82
offset = fd_resource_offset(rsc, psurf->u.tex.level,
83
psurf->u.tex.first_layer);
86
stride = gmem->bin_w * gmem->cbuf_cpp[i];
87
size = stride * gmem->bin_h;
88
base = gmem->cbuf_base[i];
90
stride = fd_resource_pitch(rsc, psurf->u.tex.level);
91
size = fd_resource_layer_stride(rsc, psurf->u.tex.level);
94
fd_resource_tile_mode(psurf->texture, psurf->u.tex.level);
98
OUT_PKT4(ring, REG_A5XX_RB_MRT_BUF_INFO(i), 5);
101
A5XX_RB_MRT_BUF_INFO_COLOR_FORMAT(format) |
102
A5XX_RB_MRT_BUF_INFO_COLOR_TILE_MODE(tile_mode) |
103
A5XX_RB_MRT_BUF_INFO_COLOR_SWAP(swap) |
105
0x800) | /* XXX 0x1000 for RECTLIST clear, 0x0 for BLIT.. */
106
COND(srgb, A5XX_RB_MRT_BUF_INFO_COLOR_SRGB));
107
OUT_RING(ring, A5XX_RB_MRT_PITCH(stride));
108
OUT_RING(ring, A5XX_RB_MRT_ARRAY_PITCH(size));
109
if (gmem || (i >= nr_bufs) || !bufs[i]) {
110
OUT_RING(ring, base); /* RB_MRT[i].BASE_LO */
111
OUT_RING(ring, 0x00000000); /* RB_MRT[i].BASE_HI */
113
OUT_RELOC(ring, rsc->bo, offset, 0, 0); /* BASE_LO/HI */
116
OUT_PKT4(ring, REG_A5XX_SP_FS_MRT_REG(i), 1);
117
OUT_RING(ring, A5XX_SP_FS_MRT_REG_COLOR_FORMAT(format) |
118
COND(sint, A5XX_SP_FS_MRT_REG_COLOR_SINT) |
119
COND(uint, A5XX_SP_FS_MRT_REG_COLOR_UINT) |
120
COND(srgb, A5XX_SP_FS_MRT_REG_COLOR_SRGB));
122
/* when we support UBWC, these would be the system memory
125
OUT_PKT4(ring, REG_A5XX_RB_MRT_FLAG_BUFFER(i), 4);
126
OUT_RING(ring, 0x00000000); /* RB_MRT_FLAG_BUFFER[i].ADDR_LO */
127
OUT_RING(ring, 0x00000000); /* RB_MRT_FLAG_BUFFER[i].ADDR_HI */
128
OUT_RING(ring, A5XX_RB_MRT_FLAG_BUFFER_PITCH(0));
129
OUT_RING(ring, A5XX_RB_MRT_FLAG_BUFFER_ARRAY_PITCH(0));
134
emit_zs(struct fd_ringbuffer *ring, struct pipe_surface *zsbuf,
135
const struct fd_gmem_stateobj *gmem)
138
struct fd_resource *rsc = fd_resource(zsbuf->texture);
139
enum a5xx_depth_format fmt = fd5_pipe2depth(zsbuf->format);
140
uint32_t cpp = rsc->layout.cpp;
145
stride = cpp * gmem->bin_w;
146
size = stride * gmem->bin_h;
148
stride = fd_resource_pitch(rsc, zsbuf->u.tex.level);
149
size = fd_resource_layer_stride(rsc, zsbuf->u.tex.level);
152
OUT_PKT4(ring, REG_A5XX_RB_DEPTH_BUFFER_INFO, 5);
153
OUT_RING(ring, A5XX_RB_DEPTH_BUFFER_INFO_DEPTH_FORMAT(fmt));
155
OUT_RING(ring, gmem->zsbuf_base[0]); /* RB_DEPTH_BUFFER_BASE_LO */
156
OUT_RING(ring, 0x00000000); /* RB_DEPTH_BUFFER_BASE_HI */
158
OUT_RELOC(ring, rsc->bo,
159
fd_resource_offset(rsc, zsbuf->u.tex.level, zsbuf->u.tex.first_layer),
160
0, 0); /* RB_DEPTH_BUFFER_BASE_LO/HI */
162
OUT_RING(ring, A5XX_RB_DEPTH_BUFFER_PITCH(stride));
163
OUT_RING(ring, A5XX_RB_DEPTH_BUFFER_ARRAY_PITCH(size));
165
OUT_PKT4(ring, REG_A5XX_GRAS_SU_DEPTH_BUFFER_INFO, 1);
166
OUT_RING(ring, A5XX_GRAS_SU_DEPTH_BUFFER_INFO_DEPTH_FORMAT(fmt));
168
OUT_PKT4(ring, REG_A5XX_RB_DEPTH_FLAG_BUFFER_BASE_LO, 3);
169
OUT_RING(ring, 0x00000000); /* RB_DEPTH_FLAG_BUFFER_BASE_LO */
170
OUT_RING(ring, 0x00000000); /* RB_DEPTH_FLAG_BUFFER_BASE_HI */
171
OUT_RING(ring, 0x00000000); /* RB_DEPTH_FLAG_BUFFER_PITCH */
174
OUT_PKT4(ring, REG_A5XX_GRAS_LRZ_BUFFER_BASE_LO, 3);
175
OUT_RELOC(ring, rsc->lrz, 0x1000, 0, 0);
176
OUT_RING(ring, A5XX_GRAS_LRZ_BUFFER_PITCH(rsc->lrz_pitch));
178
OUT_PKT4(ring, REG_A5XX_GRAS_LRZ_FAST_CLEAR_BUFFER_BASE_LO, 2);
179
OUT_RELOC(ring, rsc->lrz, 0, 0, 0);
181
OUT_PKT4(ring, REG_A5XX_GRAS_LRZ_BUFFER_BASE_LO, 3);
182
OUT_RING(ring, 0x00000000);
183
OUT_RING(ring, 0x00000000);
184
OUT_RING(ring, 0x00000000); /* GRAS_LRZ_BUFFER_PITCH */
186
OUT_PKT4(ring, REG_A5XX_GRAS_LRZ_FAST_CLEAR_BUFFER_BASE_LO, 2);
187
OUT_RING(ring, 0x00000000);
188
OUT_RING(ring, 0x00000000);
193
stride = 1 * gmem->bin_w;
194
size = stride * gmem->bin_h;
196
stride = fd_resource_pitch(rsc->stencil, zsbuf->u.tex.level);
197
size = fd_resource_layer_stride(rsc, zsbuf->u.tex.level);
200
OUT_PKT4(ring, REG_A5XX_RB_STENCIL_INFO, 5);
201
OUT_RING(ring, A5XX_RB_STENCIL_INFO_SEPARATE_STENCIL);
203
OUT_RING(ring, gmem->zsbuf_base[1]); /* RB_STENCIL_BASE_LO */
204
OUT_RING(ring, 0x00000000); /* RB_STENCIL_BASE_HI */
206
OUT_RELOC(ring, rsc->stencil->bo,
207
fd_resource_offset(rsc->stencil, zsbuf->u.tex.level, zsbuf->u.tex.first_layer),
208
0, 0); /* RB_STENCIL_BASE_LO/HI */
210
OUT_RING(ring, A5XX_RB_STENCIL_PITCH(stride));
211
OUT_RING(ring, A5XX_RB_STENCIL_ARRAY_PITCH(size));
213
OUT_PKT4(ring, REG_A5XX_RB_STENCIL_INFO, 1);
214
OUT_RING(ring, 0x00000000); /* RB_STENCIL_INFO */
217
OUT_PKT4(ring, REG_A5XX_RB_DEPTH_BUFFER_INFO, 5);
218
OUT_RING(ring, A5XX_RB_DEPTH_BUFFER_INFO_DEPTH_FORMAT(DEPTH5_NONE));
219
OUT_RING(ring, 0x00000000); /* RB_DEPTH_BUFFER_BASE_LO */
220
OUT_RING(ring, 0x00000000); /* RB_DEPTH_BUFFER_BASE_HI */
221
OUT_RING(ring, 0x00000000); /* RB_DEPTH_BUFFER_PITCH */
222
OUT_RING(ring, 0x00000000); /* RB_DEPTH_BUFFER_ARRAY_PITCH */
224
OUT_PKT4(ring, REG_A5XX_GRAS_SU_DEPTH_BUFFER_INFO, 1);
225
OUT_RING(ring, A5XX_GRAS_SU_DEPTH_BUFFER_INFO_DEPTH_FORMAT(DEPTH5_NONE));
227
OUT_PKT4(ring, REG_A5XX_RB_DEPTH_FLAG_BUFFER_BASE_LO, 3);
228
OUT_RING(ring, 0x00000000); /* RB_DEPTH_FLAG_BUFFER_BASE_LO */
229
OUT_RING(ring, 0x00000000); /* RB_DEPTH_FLAG_BUFFER_BASE_HI */
230
OUT_RING(ring, 0x00000000); /* RB_DEPTH_FLAG_BUFFER_PITCH */
232
OUT_PKT4(ring, REG_A5XX_RB_STENCIL_INFO, 1);
233
OUT_RING(ring, 0x00000000); /* RB_STENCIL_INFO */
238
emit_msaa(struct fd_ringbuffer *ring, uint32_t nr_samples)
240
enum a3xx_msaa_samples samples = fd_msaa_samples(nr_samples);
242
OUT_PKT4(ring, REG_A5XX_TPL1_TP_RAS_MSAA_CNTL, 2);
243
OUT_RING(ring, A5XX_TPL1_TP_RAS_MSAA_CNTL_SAMPLES(samples));
244
OUT_RING(ring, A5XX_TPL1_TP_DEST_MSAA_CNTL_SAMPLES(samples) |
245
COND(samples == MSAA_ONE,
246
A5XX_TPL1_TP_DEST_MSAA_CNTL_MSAA_DISABLE));
248
OUT_PKT4(ring, REG_A5XX_RB_RAS_MSAA_CNTL, 2);
249
OUT_RING(ring, A5XX_RB_RAS_MSAA_CNTL_SAMPLES(samples));
251
A5XX_RB_DEST_MSAA_CNTL_SAMPLES(samples) |
252
COND(samples == MSAA_ONE, A5XX_RB_DEST_MSAA_CNTL_MSAA_DISABLE));
254
OUT_PKT4(ring, REG_A5XX_GRAS_SC_RAS_MSAA_CNTL, 2);
255
OUT_RING(ring, A5XX_GRAS_SC_RAS_MSAA_CNTL_SAMPLES(samples));
256
OUT_RING(ring, A5XX_GRAS_SC_DEST_MSAA_CNTL_SAMPLES(samples) |
257
COND(samples == MSAA_ONE,
258
A5XX_GRAS_SC_DEST_MSAA_CNTL_MSAA_DISABLE));
262
use_hw_binning(struct fd_batch *batch)
264
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
266
if ((gmem->maxpw * gmem->maxph) > 32)
269
if ((gmem->maxpw > 15) || (gmem->maxph > 15))
272
return fd_binning_enabled && ((gmem->nbins_x * gmem->nbins_y) > 2) &&
273
(batch->num_draws > 0);
277
patch_draws(struct fd_batch *batch, enum pc_di_vis_cull_mode vismode)
280
for (i = 0; i < fd_patch_num_elements(&batch->draw_patches); i++) {
281
struct fd_cs_patch *patch = fd_patch_element(&batch->draw_patches, i);
282
*patch->cs = patch->val | DRAW4(0, 0, 0, vismode);
284
util_dynarray_clear(&batch->draw_patches);
288
update_vsc_pipe(struct fd_batch *batch) assert_dt
290
struct fd_context *ctx = batch->ctx;
291
struct fd5_context *fd5_ctx = fd5_context(ctx);
292
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
293
struct fd_ringbuffer *ring = batch->gmem;
296
OUT_PKT4(ring, REG_A5XX_VSC_BIN_SIZE, 3);
297
OUT_RING(ring, A5XX_VSC_BIN_SIZE_WIDTH(gmem->bin_w) |
298
A5XX_VSC_BIN_SIZE_HEIGHT(gmem->bin_h));
299
OUT_RELOC(ring, fd5_ctx->vsc_size_mem, 0, 0, 0); /* VSC_SIZE_ADDRESS_LO/HI */
301
OUT_PKT4(ring, REG_A5XX_UNKNOWN_0BC5, 2);
302
OUT_RING(ring, 0x00000000); /* UNKNOWN_0BC5 */
303
OUT_RING(ring, 0x00000000); /* UNKNOWN_0BC6 */
305
OUT_PKT4(ring, REG_A5XX_VSC_PIPE_CONFIG_REG(0), 16);
306
for (i = 0; i < 16; i++) {
307
const struct fd_vsc_pipe *pipe = &gmem->vsc_pipe[i];
308
OUT_RING(ring, A5XX_VSC_PIPE_CONFIG_REG_X(pipe->x) |
309
A5XX_VSC_PIPE_CONFIG_REG_Y(pipe->y) |
310
A5XX_VSC_PIPE_CONFIG_REG_W(pipe->w) |
311
A5XX_VSC_PIPE_CONFIG_REG_H(pipe->h));
314
OUT_PKT4(ring, REG_A5XX_VSC_PIPE_DATA_ADDRESS_LO(0), 32);
315
for (i = 0; i < 16; i++) {
316
if (!ctx->vsc_pipe_bo[i]) {
317
ctx->vsc_pipe_bo[i] = fd_bo_new(
318
ctx->dev, 0x20000, 0, "vsc_pipe[%u]", i);
320
OUT_RELOC(ring, ctx->vsc_pipe_bo[i], 0, 0,
321
0); /* VSC_PIPE_DATA_ADDRESS[i].LO/HI */
324
OUT_PKT4(ring, REG_A5XX_VSC_PIPE_DATA_LENGTH_REG(0), 16);
325
for (i = 0; i < 16; i++) {
326
OUT_RING(ring, fd_bo_size(ctx->vsc_pipe_bo[i]) -
327
32); /* VSC_PIPE_DATA_LENGTH[i] */
332
emit_binning_pass(struct fd_batch *batch) assert_dt
334
struct fd_ringbuffer *ring = batch->gmem;
335
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
337
uint32_t x1 = gmem->minx;
338
uint32_t y1 = gmem->miny;
339
uint32_t x2 = gmem->minx + gmem->width - 1;
340
uint32_t y2 = gmem->miny + gmem->height - 1;
342
fd5_set_render_mode(batch->ctx, ring, BINNING);
344
OUT_PKT4(ring, REG_A5XX_RB_CNTL, 1);
346
A5XX_RB_CNTL_WIDTH(gmem->bin_w) | A5XX_RB_CNTL_HEIGHT(gmem->bin_h));
348
OUT_PKT4(ring, REG_A5XX_GRAS_SC_WINDOW_SCISSOR_TL, 2);
349
OUT_RING(ring, A5XX_GRAS_SC_WINDOW_SCISSOR_TL_X(x1) |
350
A5XX_GRAS_SC_WINDOW_SCISSOR_TL_Y(y1));
351
OUT_RING(ring, A5XX_GRAS_SC_WINDOW_SCISSOR_BR_X(x2) |
352
A5XX_GRAS_SC_WINDOW_SCISSOR_BR_Y(y2));
354
OUT_PKT4(ring, REG_A5XX_RB_RESOLVE_CNTL_1, 2);
355
OUT_RING(ring, A5XX_RB_RESOLVE_CNTL_1_X(x1) | A5XX_RB_RESOLVE_CNTL_1_Y(y1));
356
OUT_RING(ring, A5XX_RB_RESOLVE_CNTL_2_X(x2) | A5XX_RB_RESOLVE_CNTL_2_Y(y2));
358
update_vsc_pipe(batch);
360
OUT_PKT4(ring, REG_A5XX_VPC_MODE_CNTL, 1);
361
OUT_RING(ring, A5XX_VPC_MODE_CNTL_BINNING_PASS);
363
fd5_event_write(batch, ring, UNK_2C, false);
365
OUT_PKT4(ring, REG_A5XX_RB_WINDOW_OFFSET, 1);
366
OUT_RING(ring, A5XX_RB_WINDOW_OFFSET_X(0) | A5XX_RB_WINDOW_OFFSET_Y(0));
368
/* emit IB to binning drawcmds: */
369
fd5_emit_ib(ring, batch->binning);
373
fd5_event_write(batch, ring, UNK_2D, false);
375
fd5_event_write(batch, ring, CACHE_FLUSH_TS, true);
377
// TODO CP_COND_WRITE's for all the vsc buffers (check for overflow??)
381
OUT_PKT4(ring, REG_A5XX_VPC_MODE_CNTL, 1);
385
/* before first tile */
387
fd5_emit_tile_init(struct fd_batch *batch) assert_dt
389
struct fd_ringbuffer *ring = batch->gmem;
390
struct pipe_framebuffer_state *pfb = &batch->framebuffer;
392
fd5_emit_restore(batch, ring);
395
fd5_emit_ib(ring, batch->prologue);
397
fd5_emit_lrz_flush(batch, ring);
399
OUT_PKT4(ring, REG_A5XX_GRAS_CL_CNTL, 1);
400
OUT_RING(ring, 0x00000080); /* GRAS_CL_CNTL */
402
OUT_PKT7(ring, CP_SKIP_IB2_ENABLE_GLOBAL, 1);
405
OUT_PKT4(ring, REG_A5XX_PC_POWER_CNTL, 1);
406
OUT_RING(ring, 0x00000003); /* PC_POWER_CNTL */
408
OUT_PKT4(ring, REG_A5XX_VFD_POWER_CNTL, 1);
409
OUT_RING(ring, 0x00000003); /* VFD_POWER_CNTL */
411
/* 0x10000000 for BYPASS.. 0x7c13c080 for GMEM: */
413
OUT_PKT4(ring, REG_A5XX_RB_CCU_CNTL, 1);
414
OUT_RING(ring, 0x7c13c080); /* RB_CCU_CNTL */
416
emit_zs(ring, pfb->zsbuf, batch->gmem_state);
417
emit_mrt(ring, pfb->nr_cbufs, pfb->cbufs, batch->gmem_state);
419
/* Enable stream output for the first pass (likely the binning). */
420
OUT_PKT4(ring, REG_A5XX_VPC_SO_OVERRIDE, 1);
423
if (use_hw_binning(batch)) {
424
emit_binning_pass(batch);
426
/* Disable stream output after binning, since each VS output should get
429
OUT_PKT4(ring, REG_A5XX_VPC_SO_OVERRIDE, 1);
430
OUT_RING(ring, A5XX_VPC_SO_OVERRIDE_SO_DISABLE);
432
fd5_emit_lrz_flush(batch, ring);
433
patch_draws(batch, USE_VISIBILITY);
435
patch_draws(batch, IGNORE_VISIBILITY);
438
fd5_set_render_mode(batch->ctx, ring, GMEM);
440
/* XXX If we're in gmem mode but not doing HW binning, then after the first
441
* tile we should disable stream output (fd6_gmem.c doesn't do that either).
445
/* before mem2gmem */
447
fd5_emit_tile_prep(struct fd_batch *batch, const struct fd_tile *tile) assert_dt
449
struct fd_context *ctx = batch->ctx;
450
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
451
struct fd5_context *fd5_ctx = fd5_context(ctx);
452
struct fd_ringbuffer *ring = batch->gmem;
454
uint32_t x1 = tile->xoff;
455
uint32_t y1 = tile->yoff;
456
uint32_t x2 = tile->xoff + tile->bin_w - 1;
457
uint32_t y2 = tile->yoff + tile->bin_h - 1;
459
OUT_PKT4(ring, REG_A5XX_GRAS_SC_WINDOW_SCISSOR_TL, 2);
460
OUT_RING(ring, A5XX_GRAS_SC_WINDOW_SCISSOR_TL_X(x1) |
461
A5XX_GRAS_SC_WINDOW_SCISSOR_TL_Y(y1));
462
OUT_RING(ring, A5XX_GRAS_SC_WINDOW_SCISSOR_BR_X(x2) |
463
A5XX_GRAS_SC_WINDOW_SCISSOR_BR_Y(y2));
465
OUT_PKT4(ring, REG_A5XX_RB_RESOLVE_CNTL_1, 2);
466
OUT_RING(ring, A5XX_RB_RESOLVE_CNTL_1_X(x1) | A5XX_RB_RESOLVE_CNTL_1_Y(y1));
467
OUT_RING(ring, A5XX_RB_RESOLVE_CNTL_2_X(x2) | A5XX_RB_RESOLVE_CNTL_2_Y(y2));
469
if (use_hw_binning(batch)) {
470
const struct fd_vsc_pipe *pipe = &gmem->vsc_pipe[tile->p];
471
struct fd_bo *pipe_bo = ctx->vsc_pipe_bo[tile->p];
473
OUT_PKT7(ring, CP_WAIT_FOR_ME, 0);
475
OUT_PKT7(ring, CP_SET_VISIBILITY_OVERRIDE, 1);
478
OUT_PKT7(ring, CP_SET_BIN_DATA5, 5);
479
OUT_RING(ring, CP_SET_BIN_DATA5_0_VSC_SIZE(pipe->w * pipe->h) |
480
CP_SET_BIN_DATA5_0_VSC_N(tile->n));
481
OUT_RELOC(ring, pipe_bo, 0, 0, 0); /* VSC_PIPE[p].DATA_ADDRESS */
482
OUT_RELOC(ring, fd5_ctx->vsc_size_mem, /* VSC_SIZE_ADDRESS + (p * 4) */
483
(tile->p * 4), 0, 0);
485
OUT_PKT7(ring, CP_SET_VISIBILITY_OVERRIDE, 1);
489
OUT_PKT4(ring, REG_A5XX_RB_WINDOW_OFFSET, 1);
490
OUT_RING(ring, A5XX_RB_WINDOW_OFFSET_X(x1) | A5XX_RB_WINDOW_OFFSET_Y(y1));
494
* transfer from system memory to gmem
498
emit_mem2gmem_surf(struct fd_batch *batch, uint32_t base,
499
struct pipe_surface *psurf, enum a5xx_blit_buf buf)
501
struct fd_ringbuffer *ring = batch->gmem;
502
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
503
struct fd_resource *rsc = fd_resource(psurf->texture);
504
uint32_t stride, size;
506
debug_assert(psurf->u.tex.first_layer == psurf->u.tex.last_layer);
511
if ((buf == BLIT_ZS) || (buf == BLIT_S)) {
512
// XXX hack import via BLIT_MRT0 instead of BLIT_ZS, since I don't
513
// know otherwise how to go from linear in sysmem to tiled in gmem.
514
// possibly we want to flip this around gmem2mem and keep depth
515
// tiled in sysmem (and fixup sampler state to assume tiled).. this
516
// might be required for doing depth/stencil in bypass mode?
517
enum a5xx_color_fmt format =
518
fd5_pipe2color(fd_gmem_restore_format(rsc->b.b.format));
520
OUT_PKT4(ring, REG_A5XX_RB_MRT_BUF_INFO(0), 5);
522
A5XX_RB_MRT_BUF_INFO_COLOR_FORMAT(format) |
523
A5XX_RB_MRT_BUF_INFO_COLOR_TILE_MODE(rsc->layout.tile_mode) |
524
A5XX_RB_MRT_BUF_INFO_COLOR_SWAP(WZYX));
525
OUT_RING(ring, A5XX_RB_MRT_PITCH(fd_resource_pitch(rsc, psurf->u.tex.level)));
526
OUT_RING(ring, A5XX_RB_MRT_ARRAY_PITCH(fd_resource_layer_stride(rsc, psurf->u.tex.level)));
527
OUT_RELOC(ring, rsc->bo,
528
fd_resource_offset(rsc, psurf->u.tex.level, psurf->u.tex.first_layer),
529
0, 0); /* BASE_LO/HI */
534
stride = gmem->bin_w << fdl_cpp_shift(&rsc->layout);
535
size = stride * gmem->bin_h;
537
OUT_PKT4(ring, REG_A5XX_RB_BLIT_FLAG_DST_LO, 4);
538
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_LO */
539
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_HI */
540
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_PITCH */
541
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_ARRAY_PITCH */
543
OUT_PKT4(ring, REG_A5XX_RB_RESOLVE_CNTL_3, 5);
544
OUT_RING(ring, 0x00000000); /* RB_RESOLVE_CNTL_3 */
545
OUT_RING(ring, base); /* RB_BLIT_DST_LO */
546
OUT_RING(ring, 0x00000000); /* RB_BLIT_DST_HI */
547
OUT_RING(ring, A5XX_RB_BLIT_DST_PITCH(stride));
548
OUT_RING(ring, A5XX_RB_BLIT_DST_ARRAY_PITCH(size));
550
OUT_PKT4(ring, REG_A5XX_RB_BLIT_CNTL, 1);
551
OUT_RING(ring, A5XX_RB_BLIT_CNTL_BUF(buf));
553
fd5_emit_blit(batch, ring);
557
fd5_emit_tile_mem2gmem(struct fd_batch *batch, const struct fd_tile *tile)
559
struct fd_ringbuffer *ring = batch->gmem;
560
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
561
struct pipe_framebuffer_state *pfb = &batch->framebuffer;
564
* setup mrt and zs with system memory base addresses:
567
emit_mrt(ring, pfb->nr_cbufs, pfb->cbufs, NULL);
568
// emit_zs(ring, pfb->zsbuf, NULL);
570
OUT_PKT4(ring, REG_A5XX_RB_CNTL, 1);
571
OUT_RING(ring, A5XX_RB_CNTL_WIDTH(gmem->bin_w) |
572
A5XX_RB_CNTL_HEIGHT(gmem->bin_h) | A5XX_RB_CNTL_BYPASS);
574
if (fd_gmem_needs_restore(batch, tile, FD_BUFFER_COLOR)) {
576
for (i = 0; i < pfb->nr_cbufs; i++) {
579
if (!(batch->restore & (PIPE_CLEAR_COLOR0 << i)))
581
emit_mem2gmem_surf(batch, gmem->cbuf_base[i], pfb->cbufs[i],
586
if (fd_gmem_needs_restore(batch, tile,
587
FD_BUFFER_DEPTH | FD_BUFFER_STENCIL)) {
588
struct fd_resource *rsc = fd_resource(pfb->zsbuf->texture);
590
if (!rsc->stencil || fd_gmem_needs_restore(batch, tile, FD_BUFFER_DEPTH))
591
emit_mem2gmem_surf(batch, gmem->zsbuf_base[0], pfb->zsbuf, BLIT_ZS);
592
if (rsc->stencil && fd_gmem_needs_restore(batch, tile, FD_BUFFER_STENCIL))
593
emit_mem2gmem_surf(batch, gmem->zsbuf_base[1], pfb->zsbuf, BLIT_S);
597
/* before IB to rendering cmds: */
599
fd5_emit_tile_renderprep(struct fd_batch *batch, const struct fd_tile *tile)
601
struct fd_ringbuffer *ring = batch->gmem;
602
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
603
struct pipe_framebuffer_state *pfb = &batch->framebuffer;
605
OUT_PKT4(ring, REG_A5XX_RB_CNTL, 1);
607
A5XX_RB_CNTL_WIDTH(gmem->bin_w) | A5XX_RB_CNTL_HEIGHT(gmem->bin_h));
609
emit_zs(ring, pfb->zsbuf, gmem);
610
emit_mrt(ring, pfb->nr_cbufs, pfb->cbufs, gmem);
611
emit_msaa(ring, pfb->samples);
615
* transfer from gmem to system memory (ie. normal RAM)
619
emit_gmem2mem_surf(struct fd_batch *batch, uint32_t base,
620
struct pipe_surface *psurf, enum a5xx_blit_buf buf)
622
struct fd_ringbuffer *ring = batch->gmem;
623
struct fd_resource *rsc = fd_resource(psurf->texture);
625
uint32_t offset, pitch;
634
fd_resource_offset(rsc, psurf->u.tex.level, psurf->u.tex.first_layer);
635
pitch = fd_resource_pitch(rsc, psurf->u.tex.level);
637
debug_assert(psurf->u.tex.first_layer == psurf->u.tex.last_layer);
639
OUT_PKT4(ring, REG_A5XX_RB_BLIT_FLAG_DST_LO, 4);
640
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_LO */
641
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_HI */
642
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_PITCH */
643
OUT_RING(ring, 0x00000000); /* RB_BLIT_FLAG_DST_ARRAY_PITCH */
645
tiled = fd_resource_tile_mode(psurf->texture, psurf->u.tex.level);
647
OUT_PKT4(ring, REG_A5XX_RB_RESOLVE_CNTL_3, 5);
648
OUT_RING(ring, 0x00000004 | /* XXX RB_RESOLVE_CNTL_3 */
649
COND(tiled, A5XX_RB_RESOLVE_CNTL_3_TILED));
650
OUT_RELOC(ring, rsc->bo, offset, 0, 0); /* RB_BLIT_DST_LO/HI */
651
OUT_RING(ring, A5XX_RB_BLIT_DST_PITCH(pitch));
652
OUT_RING(ring, A5XX_RB_BLIT_DST_ARRAY_PITCH(fd_resource_layer_stride(rsc, psurf->u.tex.level)));
654
OUT_PKT4(ring, REG_A5XX_RB_BLIT_CNTL, 1);
655
OUT_RING(ring, A5XX_RB_BLIT_CNTL_BUF(buf));
657
// bool msaa_resolve = pfb->samples > 1;
658
bool msaa_resolve = false;
659
OUT_PKT4(ring, REG_A5XX_RB_CLEAR_CNTL, 1);
660
OUT_RING(ring, COND(msaa_resolve, A5XX_RB_CLEAR_CNTL_MSAA_RESOLVE));
662
fd5_emit_blit(batch, ring);
666
fd5_emit_tile_gmem2mem(struct fd_batch *batch, const struct fd_tile *tile)
668
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
669
struct pipe_framebuffer_state *pfb = &batch->framebuffer;
671
if (batch->resolve & (FD_BUFFER_DEPTH | FD_BUFFER_STENCIL)) {
672
struct fd_resource *rsc = fd_resource(pfb->zsbuf->texture);
674
if (!rsc->stencil || (batch->resolve & FD_BUFFER_DEPTH))
675
emit_gmem2mem_surf(batch, gmem->zsbuf_base[0], pfb->zsbuf, BLIT_ZS);
676
if (rsc->stencil && (batch->resolve & FD_BUFFER_STENCIL))
677
emit_gmem2mem_surf(batch, gmem->zsbuf_base[1], pfb->zsbuf, BLIT_S);
680
if (batch->resolve & FD_BUFFER_COLOR) {
682
for (i = 0; i < pfb->nr_cbufs; i++) {
685
if (!(batch->resolve & (PIPE_CLEAR_COLOR0 << i)))
687
emit_gmem2mem_surf(batch, gmem->cbuf_base[i], pfb->cbufs[i],
694
fd5_emit_tile_fini(struct fd_batch *batch) assert_dt
696
struct fd_ringbuffer *ring = batch->gmem;
698
OUT_PKT7(ring, CP_SKIP_IB2_ENABLE_GLOBAL, 1);
701
fd5_emit_lrz_flush(batch, ring);
703
fd5_cache_flush(batch, ring);
704
fd5_set_render_mode(batch->ctx, ring, BYPASS);
708
fd5_emit_sysmem_prep(struct fd_batch *batch) assert_dt
710
struct fd_ringbuffer *ring = batch->gmem;
712
fd5_emit_restore(batch, ring);
714
fd5_emit_lrz_flush(batch, ring);
717
fd5_emit_ib(ring, batch->prologue);
719
OUT_PKT7(ring, CP_SKIP_IB2_ENABLE_GLOBAL, 1);
722
fd5_event_write(batch, ring, PC_CCU_INVALIDATE_COLOR, false);
724
OUT_PKT4(ring, REG_A5XX_PC_POWER_CNTL, 1);
725
OUT_RING(ring, 0x00000003); /* PC_POWER_CNTL */
727
OUT_PKT4(ring, REG_A5XX_VFD_POWER_CNTL, 1);
728
OUT_RING(ring, 0x00000003); /* VFD_POWER_CNTL */
730
/* 0x10000000 for BYPASS.. 0x7c13c080 for GMEM: */
732
OUT_PKT4(ring, REG_A5XX_RB_CCU_CNTL, 1);
733
OUT_RING(ring, 0x10000000); /* RB_CCU_CNTL */
735
OUT_PKT4(ring, REG_A5XX_RB_CNTL, 1);
736
OUT_RING(ring, A5XX_RB_CNTL_WIDTH(0) | A5XX_RB_CNTL_HEIGHT(0) |
737
A5XX_RB_CNTL_BYPASS);
739
/* remaining setup below here does not apply to blit/compute: */
743
struct pipe_framebuffer_state *pfb = &batch->framebuffer;
745
OUT_PKT4(ring, REG_A5XX_GRAS_SC_WINDOW_SCISSOR_TL, 2);
746
OUT_RING(ring, A5XX_GRAS_SC_WINDOW_SCISSOR_TL_X(0) |
747
A5XX_GRAS_SC_WINDOW_SCISSOR_TL_Y(0));
748
OUT_RING(ring, A5XX_GRAS_SC_WINDOW_SCISSOR_BR_X(pfb->width - 1) |
749
A5XX_GRAS_SC_WINDOW_SCISSOR_BR_Y(pfb->height - 1));
751
OUT_PKT4(ring, REG_A5XX_RB_RESOLVE_CNTL_1, 2);
752
OUT_RING(ring, A5XX_RB_RESOLVE_CNTL_1_X(0) | A5XX_RB_RESOLVE_CNTL_1_Y(0));
753
OUT_RING(ring, A5XX_RB_RESOLVE_CNTL_2_X(pfb->width - 1) |
754
A5XX_RB_RESOLVE_CNTL_2_Y(pfb->height - 1));
756
OUT_PKT4(ring, REG_A5XX_RB_WINDOW_OFFSET, 1);
757
OUT_RING(ring, A5XX_RB_WINDOW_OFFSET_X(0) | A5XX_RB_WINDOW_OFFSET_Y(0));
759
/* Enable stream output, since there's no binning pass to put it in. */
760
OUT_PKT4(ring, REG_A5XX_VPC_SO_OVERRIDE, 1);
763
OUT_PKT7(ring, CP_SET_VISIBILITY_OVERRIDE, 1);
766
patch_draws(batch, IGNORE_VISIBILITY);
768
emit_zs(ring, pfb->zsbuf, NULL);
769
emit_mrt(ring, pfb->nr_cbufs, pfb->cbufs, NULL);
770
emit_msaa(ring, pfb->samples);
774
fd5_emit_sysmem_fini(struct fd_batch *batch)
776
struct fd_ringbuffer *ring = batch->gmem;
778
OUT_PKT7(ring, CP_SKIP_IB2_ENABLE_GLOBAL, 1);
781
fd5_emit_lrz_flush(batch, ring);
783
fd5_event_write(batch, ring, PC_CCU_FLUSH_COLOR_TS, true);
784
fd5_event_write(batch, ring, PC_CCU_FLUSH_DEPTH_TS, true);
788
fd5_gmem_init(struct pipe_context *pctx) disable_thread_safety_analysis
790
struct fd_context *ctx = fd_context(pctx);
792
ctx->emit_tile_init = fd5_emit_tile_init;
793
ctx->emit_tile_prep = fd5_emit_tile_prep;
794
ctx->emit_tile_mem2gmem = fd5_emit_tile_mem2gmem;
795
ctx->emit_tile_renderprep = fd5_emit_tile_renderprep;
796
ctx->emit_tile_gmem2mem = fd5_emit_tile_gmem2mem;
797
ctx->emit_tile_fini = fd5_emit_tile_fini;
798
ctx->emit_sysmem_prep = fd5_emit_sysmem_prep;
799
ctx->emit_sysmem_fini = fd5_emit_sysmem_fini;