#include "util/u_format.h"

#include "nv50/nv50_context.h"

#include "nv50/nv50_defs.xml.h"

/*
 * Driver-private transfer object.
 *
 * rect[0] describes the mapped region of the resource itself (filled in by
 * nv50_m2mf_rect_setup), rect[1] describes the staging buffer object that is
 * handed to the CPU. nblocksx/nblocksy hold the size of the mapped box: in
 * format blocks for non-plain formats, or in pixels scaled by the miptree's
 * ms_x/ms_y shifts for plain formats.
 */
struct nv50_transfer {
   struct pipe_transfer base;
   struct nv50_m2mf_rect rect[2];
   uint32_t nblocksx;
   uint32_t nblocksy;
};

/*
 * Fill in *rect so that it describes mip level l of res, positioned at
 * (x, y, z).
 *
 * rect  - rectangle descriptor to initialise
 * res   - resource, must be an nv50_miptree
 * l     - mip level
 * x, y  - position inside the level, in pixels
 * z     - depth slice (3D layout) or array layer (otherwise)
 */
void
nv50_m2mf_rect_setup(struct nv50_m2mf_rect *rect,
                     struct pipe_resource *restrict res, unsigned l,
                     unsigned x, unsigned y, unsigned z)
{
   struct nv50_miptree *mt = nv50_miptree(res);
   const unsigned w = u_minify(res->width0, l);
   const unsigned h = u_minify(res->height0, l);

   rect->bo = mt->base.bo;
   rect->domain = mt->base.domain;
   rect->base = mt->level[l].offset;
   /* rect->base is later added to bo->offset, so if the resource's address
    * differs from the start of its bo, fold the difference in here.
    */
   if (mt->base.bo->offset != mt->base.address)
      rect->base += mt->base.address - mt->base.bo->offset;
   rect->pitch = mt->level[l].pitch;
   if (util_format_is_plain(res->format)) {
      /* plain formats: scale pixel units by the multisample shifts */
      rect->width = w << mt->ms_x;
      rect->height = h << mt->ms_y;
      rect->x = x << mt->ms_x;
      rect->y = y << mt->ms_y;
   } else {
      /* other formats: work in units of format blocks */
      rect->width = util_format_get_nblocksx(res->format, w);
      rect->height = util_format_get_nblocksy(res->format, h);
      rect->x = util_format_get_nblocksx(res->format, x);
      rect->y = util_format_get_nblocksy(res->format, y);
   }
   rect->tile_mode = mt->level[l].tile_mode;
   rect->cpp = util_format_get_blocksize(res->format);

   if (mt->layout_3d) {
      rect->z = z;
      rect->depth = u_minify(res->depth0, l);
   } else {
      /* layered layout: select the layer through the base offset instead */
      rect->base += z * mt->layer_stride;
      rect->z = 0;
      rect->depth = 1;
   }
}

/*
 * Emit M2MF commands copying nblocksx x nblocksy blocks from src to dst.
 *
 * Each side is programmed either with its tile mode and dimensions (when
 * nouveau_bo_memtype() of its bo is non-zero) or as pitch-linear memory.
 * The copy is split into pieces of at most 2047 lines.
 * Both rectangles must use the same cpp.
 */
void
nv50_m2mf_transfer_rect(struct nv50_context *nv50,
                        const struct nv50_m2mf_rect *dst,
                        const struct nv50_m2mf_rect *src,
                        uint32_t nblocksx, uint32_t nblocksy)
{
   struct nouveau_pushbuf *push = nv50->base.pushbuf;
   struct nouveau_bufctx *bctx = nv50->bufctx;
   const int cpp = dst->cpp;
   uint32_t src_ofst = src->base;
   uint32_t dst_ofst = dst->base;
   uint32_t height = nblocksy;
   uint32_t sy = src->y;
   uint32_t dy = dst->y;

   assert(dst->cpp == src->cpp);

   nouveau_bufctx_refn(bctx, 0, src->bo, src->domain | NOUVEAU_BO_RD);
   nouveau_bufctx_refn(bctx, 0, dst->bo, dst->domain | NOUVEAU_BO_WR);
   nouveau_pushbuf_bufctx(push, bctx);
   nouveau_pushbuf_validate(push);

   if (nouveau_bo_memtype(src->bo)) {
      BEGIN_NV04(push, NV50_M2MF(LINEAR_IN), 6);
      PUSH_DATA (push, 0);
      PUSH_DATA (push, src->tile_mode);
      PUSH_DATA (push, src->width * cpp);
      PUSH_DATA (push, src->height);
      PUSH_DATA (push, src->depth);
      PUSH_DATA (push, src->z);
   } else {
      /* linear source: the x/y position is applied through the byte offset */
      src_ofst += src->y * src->pitch + src->x * cpp;

      BEGIN_NV04(push, NV50_M2MF(LINEAR_IN), 1);
      PUSH_DATA (push, 1);
      BEGIN_NV04(push, SUBC_M2MF(NV03_M2MF_PITCH_IN), 1);
      PUSH_DATA (push, src->pitch);
   }

   if (nouveau_bo_memtype(dst->bo)) {
      BEGIN_NV04(push, NV50_M2MF(LINEAR_OUT), 6);
      PUSH_DATA (push, 0);
      PUSH_DATA (push, dst->tile_mode);
      PUSH_DATA (push, dst->width * cpp);
      PUSH_DATA (push, dst->height);
      PUSH_DATA (push, dst->depth);
      PUSH_DATA (push, dst->z);
   } else {
      /* linear destination: same treatment as the linear source above */
      dst_ofst += dst->y * dst->pitch + dst->x * cpp;

      BEGIN_NV04(push, NV50_M2MF(LINEAR_OUT), 1);
      PUSH_DATA (push, 1);
      BEGIN_NV04(push, SUBC_M2MF(NV03_M2MF_PITCH_OUT), 1);
      PUSH_DATA (push, dst->pitch);
   }

   while (height) {
      /* NOTE(review): 2047 is presumably the engine's per-copy line limit */
      int line_count = height > 2047 ? 2047 : height;

      BEGIN_NV04(push, NV50_M2MF(OFFSET_IN_HIGH), 2);
      PUSH_DATAh(push, src->bo->offset + src_ofst);
      PUSH_DATAh(push, dst->bo->offset + dst_ofst);

      BEGIN_NV04(push, SUBC_M2MF(NV03_M2MF_OFFSET_IN), 2);
      PUSH_DATA (push, src->bo->offset + src_ofst);
      PUSH_DATA (push, dst->bo->offset + dst_ofst);

      /* For a side programmed with a tile mode the start row is passed as
       * a position; for a linear side the byte offset is advanced instead.
       */
      if (nouveau_bo_memtype(src->bo)) {
         BEGIN_NV04(push, NV50_M2MF(TILING_POSITION_IN), 1);
         PUSH_DATA (push, (sy << 16) | (src->x * cpp));
      } else {
         src_ofst += line_count * src->pitch;
      }
      if (nouveau_bo_memtype(dst->bo)) {
         BEGIN_NV04(push, NV50_M2MF(TILING_POSITION_OUT), 1);
         PUSH_DATA (push, (dy << 16) | (dst->x * cpp));
      } else {
         dst_ofst += line_count * dst->pitch;
      }

      BEGIN_NV04(push, SUBC_M2MF(NV03_M2MF_LINE_LENGTH_IN), 4);
      PUSH_DATA (push, nblocksx * cpp);
      PUSH_DATA (push, line_count);
      PUSH_DATA (push, (1 << 8) | (1 << 0));
      PUSH_DATA (push, 0);

      height -= line_count;
      sy += line_count;
      dy += line_count;
   }

   nouveau_bufctx_reset(bctx, 0);
}

/*
 * Upload size bytes from data into dst at byte offset `offset`, pushing the
 * payload inline through the 2D engine's SIFC data method.
 *
 * The destination address is rounded down to a multiple of 256 and the low
 * 8 bits of the offset are passed as a coordinate instead.
 *
 * NOTE(review): the payload is pushed in whole 32-bit words
 * ((size + 3) / 4 of them), so up to 3 bytes past data + size are read when
 * size is not a multiple of 4 - callers need to provide readable padding.
 */
void
nv50_sifc_linear_u8(struct nouveau_context *nv,
                    struct nouveau_bo *dst, unsigned offset, unsigned domain,
                    unsigned size, const void *data)
{
   struct nv50_context *nv50 = nv50_context(&nv->pipe);
   struct nouveau_pushbuf *push = nv50->base.pushbuf;
   /* data is only read, so keep the const qualifier */
   const uint32_t *src = data;
   unsigned count = (size + 3) / 4;
   unsigned xcoord = offset & 0xff;

   nouveau_bufctx_refn(nv50->bufctx, 0, dst, domain | NOUVEAU_BO_WR);
   nouveau_pushbuf_bufctx(push, nv50->bufctx);
   nouveau_pushbuf_validate(push);

   offset &= ~0xff;

   BEGIN_NV04(push, NV50_2D(DST_FORMAT), 2);
   PUSH_DATA (push, NV50_SURFACE_FORMAT_R8_UNORM);
   PUSH_DATA (push, 1);
   BEGIN_NV04(push, NV50_2D(DST_PITCH), 5);
   PUSH_DATA (push, 262144);
   PUSH_DATA (push, 65536);
   PUSH_DATA (push, 1);
   PUSH_DATAh(push, dst->offset + offset);
   PUSH_DATA (push, dst->offset + offset);
   BEGIN_NV04(push, NV50_2D(SIFC_BITMAP_ENABLE), 2);
   PUSH_DATA (push, 0);
   PUSH_DATA (push, NV50_SURFACE_FORMAT_R8_UNORM);
   BEGIN_NV04(push, NV50_2D(SIFC_WIDTH), 10);
   PUSH_DATA (push, size);
   PUSH_DATA (push, 1);
   PUSH_DATA (push, 0);
   PUSH_DATA (push, 1);
   PUSH_DATA (push, 0);
   PUSH_DATA (push, 1);
   PUSH_DATA (push, 0);
   PUSH_DATA (push, xcoord);
   PUSH_DATA (push, 0);
   PUSH_DATA (push, 0);

   /* stream the payload, at most NV04_PFIFO_MAX_PACKET_LEN words per packet */
   while (count) {
      unsigned nr = MIN2(count, NV04_PFIFO_MAX_PACKET_LEN);

      BEGIN_NI04(push, NV50_2D(SIFC_DATA), nr);
      PUSH_DATAp(push, src, nr);

      src += nr;
      count -= nr;
   }

   nouveau_bufctx_reset(nv50->bufctx, 0);
}

/*
 * Copy size bytes from src + srcoff to dst + dstoff with M2MF, both sides
 * programmed as linear memory. The copy is issued in pieces of at most
 * 1 << 17 bytes, each as a single line.
 */
void
nv50_m2mf_copy_linear(struct nouveau_context *nv,
                      struct nouveau_bo *dst, unsigned dstoff, unsigned dstdom,
                      struct nouveau_bo *src, unsigned srcoff, unsigned srcdom,
                      unsigned size)
{
   struct nouveau_pushbuf *push = nv->pushbuf;
   struct nouveau_bufctx *bctx = nv50_context(&nv->pipe)->bufctx;

   nouveau_bufctx_refn(bctx, 0, src, srcdom | NOUVEAU_BO_RD);
   nouveau_bufctx_refn(bctx, 0, dst, dstdom | NOUVEAU_BO_WR);
   nouveau_pushbuf_bufctx(push, bctx);
   nouveau_pushbuf_validate(push);

   BEGIN_NV04(push, NV50_M2MF(LINEAR_IN), 1);
   PUSH_DATA (push, 1);
   BEGIN_NV04(push, NV50_M2MF(LINEAR_OUT), 1);
   PUSH_DATA (push, 1);

   while (size) {
      unsigned bytes = MIN2(size, 1 << 17);

      BEGIN_NV04(push, NV50_M2MF(OFFSET_IN_HIGH), 2);
      PUSH_DATAh(push, src->offset + srcoff);
      PUSH_DATAh(push, dst->offset + dstoff);
      BEGIN_NV04(push, SUBC_M2MF(NV03_M2MF_OFFSET_IN), 2);
      PUSH_DATA (push, src->offset + srcoff);
      PUSH_DATA (push, dst->offset + dstoff);
      BEGIN_NV04(push, SUBC_M2MF(NV03_M2MF_LINE_LENGTH_IN), 4);
      PUSH_DATA (push, bytes);
      PUSH_DATA (push, 1);
      PUSH_DATA (push, (1 << 8) | (1 << 0));
      PUSH_DATA (push, 0);

      srcoff += bytes;
      dstoff += bytes;
      size -= bytes;
   }

   nouveau_bufctx_reset(bctx, 0);
}

/*
 * Map a box of a miptree level through a staging buffer.
 *
 * A GART buffer object large enough for box->depth layers is allocated; for
 * PIPE_TRANSFER_READ the box is first copied into it, one layer per
 * nv50_m2mf_transfer_rect call. The staging buffer's CPU mapping is
 * returned and *ptransfer is set to the new transfer.
 *
 * Returns NULL, leaving *ptransfer untouched, if PIPE_TRANSFER_MAP_DIRECTLY
 * is requested or if allocating the transfer, allocating the staging buffer
 * or mapping it fails. Every failure path releases the reference this
 * function takes on res.
 */
void *
nv50_miptree_transfer_map(struct pipe_context *pctx,
                          struct pipe_resource *res,
                          unsigned level,
                          unsigned usage,
                          const struct pipe_box *box,
                          struct pipe_transfer **ptransfer)
{
   struct nv50_screen *screen = nv50_screen(pctx->screen);
   struct nv50_context *nv50 = nv50_context(pctx);
   struct nouveau_device *dev = nv50->screen->base.device;
   const struct nv50_miptree *mt = nv50_miptree(res);
   struct nv50_transfer *tx;
   uint32_t size;
   int ret;
   unsigned flags = 0;

   /* mapping always goes through a staging copy, never directly */
   if (usage & PIPE_TRANSFER_MAP_DIRECTLY)
      return NULL;

   tx = CALLOC_STRUCT(nv50_transfer);
   if (!tx)
      return NULL;

   /* from here on tx holds a reference on res; error paths must drop it */
   pipe_resource_reference(&tx->base.resource, res);

   tx->base.level = level;
   tx->base.usage = usage;
   tx->base.box = *box;

   if (util_format_is_plain(res->format)) {
      tx->nblocksx = box->width << mt->ms_x;
      tx->nblocksy = box->height << mt->ms_y;
   } else {
      tx->nblocksx = util_format_get_nblocksx(res->format, box->width);
      tx->nblocksy = util_format_get_nblocksy(res->format, box->height);
   }

   tx->base.stride = tx->nblocksx * util_format_get_blocksize(res->format);
   tx->base.layer_stride = tx->nblocksy * tx->base.stride;

   nv50_m2mf_rect_setup(&tx->rect[0], res, level, box->x, box->y, box->z);

   size = tx->base.layer_stride;

   ret = nouveau_bo_new(dev, NOUVEAU_BO_GART | NOUVEAU_BO_MAP, 0,
                        size * tx->base.box.depth, NULL, &tx->rect[1].bo);
   if (ret)
      goto fail_tx;

   /* staging rectangle: tightly packed, one layer at a time */
   tx->rect[1].cpp = tx->rect[0].cpp;
   tx->rect[1].width = tx->nblocksx;
   tx->rect[1].height = tx->nblocksy;
   tx->rect[1].depth = 1;
   tx->rect[1].pitch = tx->base.stride;
   tx->rect[1].domain = NOUVEAU_BO_GART;

   if (usage & PIPE_TRANSFER_READ) {
      unsigned base = tx->rect[0].base;
      unsigned z = tx->rect[0].z;
      unsigned i;

      for (i = 0; i < box->depth; ++i) {
         nv50_m2mf_transfer_rect(nv50, &tx->rect[1], &tx->rect[0],
                                 tx->nblocksx, tx->nblocksy);
         if (mt->layout_3d)
            tx->rect[0].z++;
         else
            tx->rect[0].base += mt->layer_stride;
         tx->rect[1].base += size;
      }
      /* rewind both rectangles so unmap can walk the layers again */
      tx->rect[0].z = z;
      tx->rect[0].base = base;
      tx->rect[1].base = 0;
   }

   /* the staging bo may already have a CPU mapping; reuse it if so */
   if (tx->rect[1].bo->map) {
      *ptransfer = &tx->base;
      return tx->rect[1].bo->map;
   }

   if (usage & PIPE_TRANSFER_READ)
      flags = NOUVEAU_BO_RD;
   if (usage & PIPE_TRANSFER_WRITE)
      flags |= NOUVEAU_BO_WR;

   ret = nouveau_bo_map(tx->rect[1].bo, flags, screen->base.client);
   if (ret)
      goto fail_bo;

   *ptransfer = &tx->base;
   return tx->rect[1].bo->map;

fail_bo:
   nouveau_bo_ref(NULL, &tx->rect[1].bo);
fail_tx:
   /* release the resource reference taken above, then the transfer itself */
   pipe_resource_reference(&tx->base.resource, NULL);
   FREE(tx);
   return NULL;
}

/*
 * Finish a transfer created by nv50_miptree_transfer_map.
 *
 * For PIPE_TRANSFER_WRITE the staging buffer is copied back into the
 * resource layer by layer and its release is deferred to the current fence;
 * otherwise the staging buffer is released immediately. The resource
 * reference and the transfer object are released in both cases.
 */
void
nv50_miptree_transfer_unmap(struct pipe_context *pctx,
                            struct pipe_transfer *transfer)
{
   struct nv50_context *nv50 = nv50_context(pctx);
   struct nv50_transfer *tx = (struct nv50_transfer *)transfer;
   struct nv50_miptree *mt = nv50_miptree(tx->base.resource);
   unsigned i;

   if (tx->base.usage & PIPE_TRANSFER_WRITE) {
      for (i = 0; i < tx->base.box.depth; ++i) {
         nv50_m2mf_transfer_rect(nv50, &tx->rect[0], &tx->rect[1],
                                 tx->nblocksx, tx->nblocksy);
         if (mt->layout_3d)
            tx->rect[0].z++;
         else
            tx->rect[0].base += mt->layer_stride;
         tx->rect[1].base += tx->nblocksy * tx->base.stride;
      }

      /* Allow the copies above to finish executing before freeing the source */
      nouveau_fence_work(nv50->screen->base.fence.current,
                         nouveau_fence_unref_bo, tx->rect[1].bo);
   } else {
      nouveau_bo_ref(NULL, &tx->rect[1].bo);
   }

   pipe_resource_reference(&transfer->resource, NULL);

   FREE(tx);
}

/*
 * Write `words` 32-bit words from data into the buffer at bo + base,
 * starting at byte offset `offset`, by pushing them inline through the 3D
 * engine's CB_DATA method using the NV50_CB_TMP slot.
 *
 * offset must be a multiple of 4. size is rounded up to a multiple of 0x100
 * before being programmed, and only its low 16 bits are used.
 */
void
nv50_cb_push(struct nouveau_context *nv,
             struct nouveau_bo *bo, unsigned domain,
             unsigned base, unsigned size,
             unsigned offset, unsigned words, const uint32_t *data)
{
   struct nouveau_pushbuf *push = nv->pushbuf;
   struct nouveau_bufctx *bctx = nv50_context(&nv->pipe)->bufctx;

   assert(!(offset & 3));
   size = align(size, 0x100);

   nouveau_bufctx_refn(bctx, 0, bo, NOUVEAU_BO_WR | domain);
   nouveau_pushbuf_bufctx(push, bctx);
   nouveau_pushbuf_validate(push);

   while (words) {
      unsigned nr = MIN2(words, NV04_PFIFO_MAX_PACKET_LEN);

      /* nr payload words plus 7 more for the three method packets below
       * (assuming one header word per BEGIN_* - TODO confirm)
       */
      PUSH_SPACE(push, nr + 7);
      BEGIN_NV04(push, NV50_3D(CB_DEF_ADDRESS_HIGH), 3);
      PUSH_DATAh(push, bo->offset + base);
      PUSH_DATA (push, bo->offset + base);
      PUSH_DATA (push, (NV50_CB_TMP << 16) | (size & 0xffff));
      BEGIN_NV04(push, NV50_3D(CB_ADDR), 1);
      /* offset is in bytes and 4-aligned, so (offset << 6) places the word
       * index at bit 8
       */
      PUSH_DATA (push, (offset << 6) | NV50_CB_TMP);
      BEGIN_NI04(push, NV50_3D(CB_DATA(0)), nr);
      PUSH_DATAp(push, data, nr);

      words -= nr;
      data += nr;
      offset += nr * 4;
   }

   nouveau_bufctx_reset(bctx, 0);
}