/*
 * Copyright 2008 Ben Skeggs
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */

#include "pipe/p_state.h"
#include "pipe/p_defines.h"
#include "util/u_inlines.h"
#include "util/u_format.h"

#include "nv50/nv50_context.h"
#include "nv50/nv50_resource.h"

/**
 * Pick a tile mode for a level of @ny block rows and @nz depth slices.
 *
 * The returned value carries the tile-height selector in the 0x0f0 nibble
 * and, for 3D layouts only, the tile-depth selector in the 0xf00 nibble.
 * Larger surfaces get larger tiles; for 3D layouts the height selector is
 * capped at 0x020, and the deepest depth selector (0x500) is only used while
 * the height selector is below 0x020.
 *
 * @param nx     width in blocks; accepted for interface symmetry, not used
 * @param ny     height in blocks
 * @param nz     depth in slices (only consulted when @is_3d is true)
 * @param is_3d  whether a depth selector should be chosen as well
 * @return the encoded tile mode
 */
uint32_t
nv50_tex_choose_tile_dims_helper(unsigned nx, unsigned ny, unsigned nz,
                                 bool is_3d)
{
   uint32_t tile_mode = 0x000;

   if (ny > 64)
      tile_mode = 0x040; /* height 128 tiles */
   else if (ny > 32)
      tile_mode = 0x030; /* height 64 tiles */
   else if (ny > 16)
      tile_mode = 0x020; /* height 32 tiles */
   else if (ny > 8)
      tile_mode = 0x010; /* height 16 tiles */

   if (!is_3d)
      return tile_mode;
   else if (tile_mode > 0x020)
      tile_mode = 0x020;

   if (nz > 16 && tile_mode < 0x020)
      return tile_mode | 0x500; /* depth 32 tiles */
   if (nz > 8)
      return tile_mode | 0x400; /* depth 16 tiles */
   if (nz > 4)
      return tile_mode | 0x300; /* depth 8 tiles */
   if (nz > 2)
      return tile_mode | 0x200; /* depth 4 tiles */
   if (nz > 1)
      return tile_mode | 0x100; /* depth 2 tiles */

   return tile_mode;
}

/**
 * nv50 front end for the tile-mode helper: the row count is doubled before
 * the helper's thresholds are applied.
 *
 * NOTE(review): the helper is non-static, presumably because it is shared
 * with another driver whose tile heights differ by a factor of two -- confirm.
 */
static uint32_t
nv50_tex_choose_tile_dims(unsigned nx, unsigned ny, unsigned nz, bool is_3d)
{
   return nv50_tex_choose_tile_dims_helper(nx, ny * 2, nz, is_3d);
}

/**
 * Select the memory storage type ("tile flags") for a miptree.
 *
 * @param mt          miptree whose format, bind flags, resource flags and
 *                    sample count are inspected
 * @param compressed  whether compressed storage types may be used at all
 * @return 0 when the resource has to be laid out linearly (linear flag,
 *         cursor binding, or an unsupported block size); otherwise a
 *         non-zero storage type.  Bits 0x180 are cleared from the result
 *         whenever compression is not in effect.
 */
static uint32_t
nv50_mt_choose_storage_type(struct nv50_miptree *mt, bool compressed)
{
   /* log2 of the sample count; used as an offset/selector below */
   const unsigned ms = util_logbase2(mt->base.base.nr_samples);
   uint32_t tile_flags;

   if (unlikely(mt->base.base.flags & NOUVEAU_RESOURCE_FLAG_LINEAR))
      return 0;
   if (unlikely(mt->base.base.bind & PIPE_BIND_CURSOR))
      return 0;

   switch (mt->base.base.format) {
   case PIPE_FORMAT_Z16_UNORM:
      tile_flags = 0x6c + ms;
      break;
   case PIPE_FORMAT_X8Z24_UNORM:
   case PIPE_FORMAT_S8X24_UINT:
   case PIPE_FORMAT_S8_UINT_Z24_UNORM:
      tile_flags = 0x18 + ms;
      break;
   case PIPE_FORMAT_X24S8_UINT:
   case PIPE_FORMAT_Z24X8_UNORM:
   case PIPE_FORMAT_Z24_UNORM_S8_UINT:
      tile_flags = 0x128 + ms;
      break;
   case PIPE_FORMAT_Z32_FLOAT:
      tile_flags = 0x40 + ms;
      break;
   case PIPE_FORMAT_X32_S8X24_UINT:
   case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT:
      tile_flags = 0x60 + ms;
      break;
   default:
      /* Most color formats don't work with compression. */
      compressed = false;
      /* fallthrough */
   case PIPE_FORMAT_R8G8B8A8_UNORM:
   case PIPE_FORMAT_R8G8B8A8_SRGB:
   case PIPE_FORMAT_R8G8B8X8_UNORM:
   case PIPE_FORMAT_R8G8B8X8_SRGB:
   case PIPE_FORMAT_B8G8R8A8_UNORM:
   case PIPE_FORMAT_B8G8R8A8_SRGB:
   case PIPE_FORMAT_B8G8R8X8_UNORM:
   case PIPE_FORMAT_B8G8R8X8_SRGB:
   case PIPE_FORMAT_R10G10B10A2_UNORM:
   case PIPE_FORMAT_B10G10R10A2_UNORM:
   case PIPE_FORMAT_R16G16B16A16_FLOAT:
   case PIPE_FORMAT_R16G16B16X16_FLOAT:
   case PIPE_FORMAT_R11G11B10_FLOAT:
      /* Color formats: the storage type depends on the block size in bits. */
      switch (util_format_get_blocksizebits(mt->base.base.format)) {
      case 128:
         assert(ms < 3);
         tile_flags = 0x74;
         break;
      case 64:
         switch (ms) {
         case 2:
            tile_flags = 0xfc;
            break;
         case 3:
            tile_flags = 0xfd;
            break;
         default:
            tile_flags = 0x70;
            break;
         }
         break;
      case 32:
         if (mt->base.base.bind & PIPE_BIND_SCANOUT) {
            assert(ms == 0);
            tile_flags = 0x7a;
         } else {
            switch (ms) {
            case 2:
               tile_flags = 0xf8;
               break;
            case 3:
               tile_flags = 0xf9;
               break;
            default:
               tile_flags = 0x70;
               break;
            }
         }
         break;
      case 16:
      case 8:
         tile_flags = 0x70;
         break;
      default:
         return 0;
      }
      /* PIPE_BIND_CURSOR needs no handling here: it already returned 0
       * at the top of the function.
       */
   }

   if (!compressed)
      tile_flags &= ~0x180;

   return tile_flags;
}

/**
 * Destroy a miptree: release its buffer object and fences, update the
 * driver statistics and free the structure.
 *
 * If the resource still has a fence that has not reached the FLUSHED state,
 * the buffer-object unreference is queued as fence work instead of being
 * performed immediately.
 */
void
nv50_miptree_destroy(struct pipe_screen *pscreen, struct pipe_resource *pt)
{
   struct nv50_miptree *mt = nv50_miptree(pt);

   if (mt->base.fence && mt->base.fence->state < NOUVEAU_FENCE_STATE_FLUSHED)
      nouveau_fence_work(mt->base.fence, nouveau_fence_unref_bo, mt->base.bo);
   else
      nouveau_bo_ref(NULL, &mt->base.bo);

   nouveau_fence_ref(NULL, &mt->base.fence);
   nouveau_fence_ref(NULL, &mt->base.fence_wr);

   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_count, -1);
   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_bytes,
                    -(uint64_t)mt->total_size);

   FREE(mt);
}

/**
 * Export a winsys handle for the miptree's buffer object, using the pitch
 * of level 0 as the stride.
 *
 * @return false if there is no miptree or it has no buffer object,
 *         otherwise the result of nouveau_screen_bo_get_handle().
 */
boolean
nv50_miptree_get_handle(struct pipe_screen *pscreen,
                        struct pipe_resource *pt,
                        struct winsys_handle *whandle)
{
   struct nv50_miptree *mt = nv50_miptree(pt);
   unsigned stride;

   if (!mt || !mt->base.bo)
      return false;

   stride = mt->level[0].pitch;

   return nouveau_screen_bo_get_handle(pscreen, mt->base.bo, stride, whandle);
}

/* Resource vtable installed on every miptree created in this file. */
const struct u_resource_vtbl nv50_miptree_vtbl =
{
   nv50_miptree_get_handle,         /* get_handle */
   nv50_miptree_destroy,            /* resource_destroy */
   nv50_miptree_transfer_map,       /* transfer_map */
   u_default_transfer_flush_region, /* transfer_flush_region */
   nv50_miptree_transfer_unmap,     /* transfer_unmap */
};

/**
 * Translate the resource's sample count into the hardware multisample mode
 * and the x/y shifts later applied to the surface dimensions.
 *
 * Fields not assigned for a given sample count are left untouched; the
 * callers in this file pass a structure obtained from CALLOC_STRUCT
 * (presumably zero-initialised -- confirm).
 *
 * @return false (after logging an error) for an unsupported sample count.
 */
static inline bool
nv50_miptree_init_ms_mode(struct nv50_miptree *mt)
{
   switch (mt->base.base.nr_samples) {
   case 8:
      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS8;
      mt->ms_x = 2;
      mt->ms_y = 1;
      break;
   case 4:
      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS4;
      mt->ms_x = 1;
      mt->ms_y = 1;
      break;
   case 2:
      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS2;
      mt->ms_x = 1;
      break;
   case 1:
   case 0:
      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS1;
      break;
   default:
      NOUVEAU_ERR("invalid nr_samples: %u\n", mt->base.base.nr_samples);
      return false;
   }
   return true;
}

/**
 * Set up a linear (pitch) layout for a single-level, single-layer,
 * non-multisampled colour resource.
 *
 * @param mt           miptree to lay out; level[0].pitch and total_size
 *                     are written on success
 * @param pitch_align  alignment applied to the row pitch in bytes
 * @return false if the resource cannot be laid out linearly (depth/stencil
 *         format, mip levels, depth, array layers or multisampling).
 */
bool
nv50_miptree_init_layout_linear(struct nv50_miptree *mt, unsigned pitch_align)
{
   struct pipe_resource *pt = &mt->base.base;
   const unsigned blocksize = util_format_get_blocksize(pt->format);
   unsigned h = pt->height0;

   if (util_format_is_depth_or_stencil(pt->format))
      return false;

   if ((pt->last_level > 0) || (pt->depth0 > 1) || (pt->array_size > 1))
      return false;
   if (mt->ms_x | mt->ms_y)
      return false;

   mt->level[0].pitch = align(pt->width0 * blocksize, pitch_align);

   /* Account for very generous prefetch (allocate size as if tiled). */
   h = MAX2(h, 8);
   h = util_next_power_of_two(h);

   mt->total_size = mt->level[0].pitch * h;

   return true;
}

/**
 * Set up the fixed layout used for video resources: a single level with
 * tile mode 0x20, a 64-byte aligned pitch and a height aligned to 16 rows.
 * For array resources each layer is padded to the size of one 0x20 tile.
 */
static void
nv50_miptree_init_layout_video(struct nv50_miptree *mt)
{
   const struct pipe_resource *pt = &mt->base.base;
   const unsigned blocksize = util_format_get_blocksize(pt->format);

   assert(pt->last_level == 0);
   assert(mt->ms_x == 0 && mt->ms_y == 0);
   assert(!util_format_is_compressed(pt->format));

   mt->layout_3d = pt->target == PIPE_TEXTURE_3D;

   mt->level[0].tile_mode = 0x20;
   mt->level[0].pitch = align(pt->width0 * blocksize, 64);
   mt->total_size = align(pt->height0, 16) * mt->level[0].pitch *
                    (mt->layout_3d ? pt->depth0 : 1);

   if (pt->array_size > 1) {
      mt->layer_stride = align(mt->total_size, NV50_TILE_SIZE(0x20));
      mt->total_size = mt->layer_stride * pt->array_size;
   }
}

/**
 * Set up a tiled layout: for every mip level choose a tile mode, record the
 * level's offset and pitch, and accumulate the total size.  Array resources
 * replicate the whole mip chain per layer at a stride aligned to the size
 * of level 0's tile.
 */
static void
nv50_miptree_init_layout_tiled(struct nv50_miptree *mt)
{
   struct pipe_resource *pt = &mt->base.base;
   unsigned w, h, d, l;
   const unsigned blocksize = util_format_get_blocksize(pt->format);

   mt->layout_3d = pt->target == PIPE_TEXTURE_3D;

   /* Multisampled surfaces are stored scaled up by the sample shifts. */
   w = pt->width0 << mt->ms_x;
   h = pt->height0 << mt->ms_y;

   /* For 3D textures, a mipmap is spanned by all the layers, for array
    * textures and cube maps, each layer contains its own mipmaps.
    */
   d = mt->layout_3d ? pt->depth0 : 1;

   for (l = 0; l <= pt->last_level; ++l) {
      struct nv50_miptree_level *lvl = &mt->level[l];
      unsigned tsx, tsy, tsz;
      unsigned nbx = util_format_get_nblocksx(pt->format, w);
      unsigned nby = util_format_get_nblocksy(pt->format, h);

      lvl->offset = mt->total_size;

      lvl->tile_mode = nv50_tex_choose_tile_dims(nbx, nby, d, mt->layout_3d);

      tsx = NV50_TILE_SIZE_X(lvl->tile_mode); /* x is tile row pitch in bytes */
      tsy = NV50_TILE_SIZE_Y(lvl->tile_mode);
      tsz = NV50_TILE_SIZE_Z(lvl->tile_mode);

      lvl->pitch = align(nbx * blocksize, tsx);

      mt->total_size += lvl->pitch * align(nby, tsy) * align(d, tsz);

      w = u_minify(w, 1);
      h = u_minify(h, 1);
      d = u_minify(d, 1);
   }

   if (pt->array_size > 1) {
      mt->layer_stride = align(mt->total_size,
                               NV50_TILE_SIZE(mt->level[0].tile_mode));
      mt->total_size = mt->layer_stride * pt->array_size;
   }
}

/**
 * Create a miptree resource from a template.
 *
 * Chooses the storage type and layout (video, tiled or linear), then
 * allocates the backing buffer object unless the resource is a video
 * resource flagged NOALLOC, in which case the client provides the BO.
 *
 * @return the new resource, or NULL on allocation failure, an invalid
 *         sample count, or a resource that fits neither tiled nor linear
 *         layout.
 */
struct pipe_resource *
nv50_miptree_create(struct pipe_screen *pscreen,
                    const struct pipe_resource *templ)
{
   struct nouveau_device *dev = nouveau_screen(pscreen)->device;
   struct nouveau_drm *drm = nouveau_screen(pscreen)->drm;
   struct nv50_miptree *mt = CALLOC_STRUCT(nv50_miptree);
   struct pipe_resource *pt;
   bool compressed = drm->version >= 0x01000101;
   int ret;
   union nouveau_bo_config bo_config;
   uint32_t bo_flags;

   if (!mt)
      return NULL;

   /* Only form the member address once mt is known to be valid. */
   pt = &mt->base.base;

   mt->base.vtbl = &nv50_miptree_vtbl;
   *pt = *templ;
   pipe_reference_init(&pt->reference, 1);
   pt->screen = pscreen;

   if (pt->bind & PIPE_BIND_LINEAR)
      pt->flags |= NOUVEAU_RESOURCE_FLAG_LINEAR;

   bo_config.nv50.memtype = nv50_mt_choose_storage_type(mt, compressed);

   if (!nv50_miptree_init_ms_mode(mt)) {
      FREE(mt);
      return NULL;
   }

   if (unlikely(pt->flags & NV50_RESOURCE_FLAG_VIDEO)) {
      nv50_miptree_init_layout_video(mt);
      if (pt->flags & NV50_RESOURCE_FLAG_NOALLOC) {
         /* BO allocation done by client */

         /* nv50_miptree_destroy() subtracts these unconditionally, so
          * account for the object here to keep the counters balanced.
          */
         NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_count, 1);
         NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_bytes,
                          mt->total_size);
         return pt;
      }
   } else if (bo_config.nv50.memtype != 0) {
      nv50_miptree_init_layout_tiled(mt);
   } else if (!nv50_miptree_init_layout_linear(mt, 64)) {
      FREE(mt);
      return NULL;
   }
   bo_config.nv50.tile_mode = mt->level[0].tile_mode;

   /* Linear (memtype 0) shared resources go to GART, everything else to
    * the screen's VRAM domain.
    */
   if (!bo_config.nv50.memtype && (pt->bind & PIPE_BIND_SHARED))
      mt->base.domain = NOUVEAU_BO_GART;
   else
      mt->base.domain = NV_VRAM_DOMAIN(nouveau_screen(pscreen));

   bo_flags = mt->base.domain | NOUVEAU_BO_NOSNOOP;
   if (mt->base.base.bind & (PIPE_BIND_CURSOR | PIPE_BIND_DISPLAY_TARGET))
      bo_flags |= NOUVEAU_BO_CONTIG;

   ret = nouveau_bo_new(dev, bo_flags, 4096, mt->total_size, &bo_config,
                        &mt->base.bo);
   if (ret) {
      FREE(mt);
      return NULL;
   }
   mt->base.address = mt->base.bo->offset;

   /* Mirror the decrements performed by nv50_miptree_destroy(). */
   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_count, 1);
   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_bytes,
                    mt->total_size);

   return pt;
}

/**
 * Wrap an imported buffer object (winsys handle) in a miptree.
 *
 * The pitch comes from the handle's stride and the tile mode from the
 * buffer object's own configuration.  total_size is left at its initial
 * value, so only the object count statistic is updated.
 *
 * @return the new resource, or NULL if the template is unsupported, on
 *         allocation failure, or if the handle cannot be imported.
 */
struct pipe_resource *
nv50_miptree_from_handle(struct pipe_screen *pscreen,
                         const struct pipe_resource *templ,
                         struct winsys_handle *whandle)
{
   struct nv50_miptree *mt;
   unsigned stride;

   /* only supports 2D, non-mipmapped textures for the moment */
   if ((templ->target != PIPE_TEXTURE_2D &&
        templ->target != PIPE_TEXTURE_RECT) ||
       templ->last_level != 0 ||
       templ->depth0 != 1 ||
       templ->array_size > 1)
      return NULL;

   mt = CALLOC_STRUCT(nv50_miptree);
   if (!mt)
      return NULL;

   mt->base.bo = nouveau_screen_bo_from_handle(pscreen, whandle, &stride);
   if (mt->base.bo == NULL) {
      FREE(mt);
      return NULL;
   }
   mt->base.domain = mt->base.bo->flags & NOUVEAU_BO_APER;
   mt->base.address = mt->base.bo->offset;

   mt->base.base = *templ;
   mt->base.vtbl = &nv50_miptree_vtbl;
   pipe_reference_init(&mt->base.base.reference, 1);
   mt->base.base.screen = pscreen;
   mt->level[0].pitch = stride;
   mt->level[0].offset = 0;
   mt->level[0].tile_mode = mt->base.bo->config.nv50.tile_mode;

   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_count, 1);

   /* no need to adjust bo reference count */
   return &mt->base.base;
}

/* Offset of zslice @z from start of level @l. */
inline unsigned
nv50_mt_zslice_offset(const struct nv50_miptree *mt, unsigned l, unsigned z)
{
   const struct pipe_resource *pt = &mt->base.base;

   /* log2 of the tile depth and tile height of this level */
   unsigned tds = NV50_TILE_SHIFT_Z(mt->level[l].tile_mode);
   unsigned ths = NV50_TILE_SHIFT_Y(mt->level[l].tile_mode);

   unsigned nby = util_format_get_nblocksy(pt->format,
                                           u_minify(pt->height0, l));

   /* to next 2D tile slice within a 3D tile */
   unsigned stride_2d = NV50_TILE_SIZE_2D(mt->level[l].tile_mode);

   /* to slice in the next (in z direction) 3D tile */
   unsigned stride_3d = (align(nby, (1 << ths)) * mt->level[l].pitch) << tds;

   /* low bits of z select the slice inside a tile, high bits select the tile */
   return (z & ((1 << tds) - 1)) * stride_2d + (z >> tds) * stride_3d;
}

/* Surface functions.
 */

/**
 * Allocate a surface describing one mip level (and layer range) of @mt.
 *
 * The surface takes a reference on the miptree.  The generic pipe_surface
 * width/height hold the minified level size, while the nv50 surface's own
 * width/height are additionally scaled by the multisample shifts.  The
 * offset is that of the level only; layer offsets are applied by the caller.
 *
 * @return the new surface, or NULL on allocation failure.
 */
struct nv50_surface *
nv50_surface_from_miptree(struct nv50_miptree *mt,
                          const struct pipe_surface *templ)
{
   struct pipe_surface *ps;
   struct nv50_surface *ns = CALLOC_STRUCT(nv50_surface);
   if (!ns)
      return NULL;
   ps = &ns->base;

   pipe_reference_init(&ps->reference, 1);
   pipe_resource_reference(&ps->texture, &mt->base.base);

   ps->format = templ->format;
   ps->writable = templ->writable;
   ps->u.tex.level = templ->u.tex.level;
   ps->u.tex.first_layer = templ->u.tex.first_layer;
   ps->u.tex.last_layer = templ->u.tex.last_layer;

   ns->width = u_minify(mt->base.base.width0, ps->u.tex.level);
   ns->height = u_minify(mt->base.base.height0, ps->u.tex.level);
   ns->depth = ps->u.tex.last_layer - ps->u.tex.first_layer + 1;
   ns->offset = mt->level[templ->u.tex.level].offset;

   /* comment says these are going to be removed, but they're used by the st */
   ps->width = ns->width;
   ps->height = ns->height;

   ns->width <<= mt->ms_x;
   ns->height <<= mt->ms_y;

   return ns;
}

/**
 * Create a surface for @pt and, when it does not start at layer 0, advance
 * its offset to the first layer: by z-slice offset for 3D layouts, by the
 * layer stride otherwise.
 *
 * @return the new surface, or NULL on allocation failure.
 */
struct pipe_surface *
nv50_miptree_surface_new(struct pipe_context *pipe,
                         struct pipe_resource *pt,
                         const struct pipe_surface *templ)
{
   struct nv50_miptree *mt = nv50_miptree(pt);
   struct nv50_surface *ns = nv50_surface_from_miptree(mt, templ);
   if (!ns)
      return NULL;
   ns->base.context = pipe;

   if (ns->base.u.tex.first_layer) {
      const unsigned l = ns->base.u.tex.level;
      const unsigned z = ns->base.u.tex.first_layer;

      if (mt->layout_3d) {
         ns->offset += nv50_mt_zslice_offset(mt, l, z);

         /* TODO: switch to depth 1 tiles; but actually this shouldn't happen */
         if (ns->depth > 1 &&
             (z & (NV50_TILE_SIZE_Z(mt->level[l].tile_mode) - 1)))
            NOUVEAU_ERR("Creating unsupported 3D surface !\n");
      } else {
         ns->offset += mt->layer_stride * z;
      }
   }

   return &ns->base;
}