Commit 9a391ad8 authored by Ben Skeggs

drm/nv50: switch to indirect push buffer controls

PFIFO on G80 and up has a new mode where the main ring buffer is simply a
ring of pointers to indirect buffers containing the actual command/data
packets.  In order to be able to implement index buffers in the 3D driver
we need to be able to submit data-only push buffers right after the cmd
packet header, which is only possible using the new command submission
method.

This commit doesn't make it possible to implement index buffers yet; some
userspace interface changes will be required. It does, however, allow for
testing/debugging of the hardware-side support in the meantime.
Signed-off-by: Ben Skeggs <bskeggs@redhat.com>
parent ff9e5279
...@@ -47,12 +47,23 @@ nouveau_debugfs_channel_info(struct seq_file *m, void *data) ...@@ -47,12 +47,23 @@ nouveau_debugfs_channel_info(struct seq_file *m, void *data)
seq_printf(m, " cur: 0x%08x\n", chan->dma.cur << 2); seq_printf(m, " cur: 0x%08x\n", chan->dma.cur << 2);
seq_printf(m, " put: 0x%08x\n", chan->dma.put << 2); seq_printf(m, " put: 0x%08x\n", chan->dma.put << 2);
seq_printf(m, " free: 0x%08x\n", chan->dma.free << 2); seq_printf(m, " free: 0x%08x\n", chan->dma.free << 2);
if (chan->dma.ib_max) {
seq_printf(m, " ib max: 0x%08x\n", chan->dma.ib_max);
seq_printf(m, " ib put: 0x%08x\n", chan->dma.ib_put);
seq_printf(m, " ib free: 0x%08x\n", chan->dma.ib_free);
}
seq_printf(m, "gpu fifo state:\n"); seq_printf(m, "gpu fifo state:\n");
seq_printf(m, " get: 0x%08x\n", seq_printf(m, " get: 0x%08x\n",
nvchan_rd32(chan, chan->user_get)); nvchan_rd32(chan, chan->user_get));
seq_printf(m, " put: 0x%08x\n", seq_printf(m, " put: 0x%08x\n",
nvchan_rd32(chan, chan->user_put)); nvchan_rd32(chan, chan->user_put));
if (chan->dma.ib_max) {
seq_printf(m, " ib get: 0x%08x\n",
nvchan_rd32(chan, 0x88));
seq_printf(m, " ib put: 0x%08x\n",
nvchan_rd32(chan, 0x8c));
}
seq_printf(m, "last fence : %d\n", chan->fence.sequence); seq_printf(m, "last fence : %d\n", chan->fence.sequence);
seq_printf(m, "last signalled: %d\n", chan->fence.sequence_ack); seq_printf(m, "last signalled: %d\n", chan->fence.sequence_ack);
......
...@@ -32,7 +32,22 @@ ...@@ -32,7 +32,22 @@
void void
nouveau_dma_pre_init(struct nouveau_channel *chan) nouveau_dma_pre_init(struct nouveau_channel *chan)
{ {
chan->dma.max = (chan->pushbuf_bo->bo.mem.size >> 2) - 2; struct drm_nouveau_private *dev_priv = chan->dev->dev_private;
struct nouveau_bo *pushbuf = chan->pushbuf_bo;
if (dev_priv->card_type == NV_50) {
const int ib_size = pushbuf->bo.mem.size / 2;
chan->dma.ib_base = (pushbuf->bo.mem.size - ib_size) >> 2;
chan->dma.ib_max = (ib_size / 8) - 1;
chan->dma.ib_put = 0;
chan->dma.ib_free = chan->dma.ib_max - chan->dma.ib_put;
chan->dma.max = (pushbuf->bo.mem.size - ib_size) >> 2;
} else {
chan->dma.max = (pushbuf->bo.mem.size >> 2) - 2;
}
chan->dma.put = 0; chan->dma.put = 0;
chan->dma.cur = chan->dma.put; chan->dma.cur = chan->dma.put;
chan->dma.free = chan->dma.max - chan->dma.cur; chan->dma.free = chan->dma.max - chan->dma.cur;
...@@ -162,12 +177,101 @@ READ_GET(struct nouveau_channel *chan, uint32_t *prev_get, uint32_t *timeout) ...@@ -162,12 +177,101 @@ READ_GET(struct nouveau_channel *chan, uint32_t *prev_get, uint32_t *timeout)
return (val - chan->pushbuf_base) >> 2; return (val - chan->pushbuf_base) >> 2;
} }
/*
 * Queue one indirect-buffer entry on the channel's ring of buffer pointers.
 *
 * @chan:   channel whose push buffer object holds the entry ring
 * @bo:     buffer object containing the commands/data to be fetched
 * @delta:  byte offset added to the start of @bo
 * @dwords: length value for the entry; it is stored shifted left by 10
 *
 * Two 32-bit words are written into the push buffer object at the slot
 * selected by dma.ib_put, after which the software put index is advanced
 * (wrapping with dma.ib_max used as a mask) and written to channel
 * register 0x8c.  The caller must already have ensured that at least one
 * entry is free; this is enforced with BUG_ON().
 */
void
nv50_dma_push(struct nouveau_channel *chan, struct nouveau_bo *bo,
	      int delta, int dwords)
{
	struct nouveau_bo *ring = chan->pushbuf_bo;
	/*
	 * NOTE(review): addr is 64 bits wide but is handed to a single
	 * nouveau_bo_wr32() call below -- presumably only the low 32 bits
	 * end up in the entry; confirm that is sufficient for every buffer.
	 */
	uint64_t addr = (bo->bo.mem.mm_node->start << PAGE_SHIFT) + delta;
	/* each entry occupies two words, starting ib_base words into the bo */
	int slot = chan->dma.ib_base + (chan->dma.ib_put * 2);

	BUG_ON(chan->dma.ib_free < 1);

	/* fill in the entry before the new put index is made visible */
	nouveau_bo_wr32(ring, slot, addr);
	nouveau_bo_wr32(ring, slot + 1, dwords << 10);

	chan->dma.ib_put = (chan->dma.ib_put + 1) & chan->dma.ib_max;
	nvchan_wr32(chan, 0x8c, chan->dma.ib_put);

	chan->dma.ib_free--;
}
/*
 * Poll until at least @count indirect-buffer entries are free on @chan.
 *
 * The free count is recomputed from channel register 0x88 (the value the
 * debugfs code labels "ib get") and the software put index.  The spin
 * counter restarts whenever the value read from 0x88 changes; every 256th
 * iteration delays for 1us, and once the counter exceeds 100000 without
 * the register changing the wait is abandoned.
 *
 * Returns 0 once enough entries are free, -EBUSY on timeout.
 */
static int
nv50_dma_push_wait(struct nouveau_channel *chan, int count)
{
	uint32_t spins = 0, last_get = 0;

	for (;;) {
		uint32_t hw_get;

		if (chan->dma.ib_free >= count)
			return 0;

		hw_get = nvchan_rd32(chan, 0x88);
		if (hw_get != last_get) {
			/* the register moved, so restart the timeout */
			last_get = hw_get;
			spins = 0;
		}

		spins++;
		if (!(spins & 0xff)) {
			DRM_UDELAY(1);
			if (spins > 100000)
				return -EBUSY;
		}

		/* distance from put to get; a non-positive result has wrapped */
		chan->dma.ib_free = hw_get - chan->dma.ib_put;
		if (chan->dma.ib_free <= 0)
			chan->dma.ib_free += chan->dma.ib_max + 1;
	}
}
/*
 * Wait until @chan has room for @slots indirect-buffer entries (one more
 * than that is actually requested) and @count dwords of command space in
 * the push buffer.
 *
 * Returns 0 on success, or a negative error code propagated from
 * nv50_dma_push_wait() or READ_GET().
 */
static int
nv50_dma_wait(struct nouveau_channel *chan, int slots, int count)
{
	uint32_t cnt = 0, prev_get = 0;
	int ret;

	/* always ask for one entry beyond what the caller needs */
	ret = nv50_dma_push_wait(chan, slots + 1);
	if (unlikely(ret))
		return ret;

	while (chan->dma.free < count) {
		int get = READ_GET(chan, &prev_get, &cnt);

		if (unlikely(get < 0)) {
			/* -EINVAL is treated as "read again" */
			if (get == -EINVAL)
				continue;
			return get;
		}

		if (get <= chan->dma.cur) {
			/* free space runs from cur to the end of the buffer */
			chan->dma.free = chan->dma.max - chan->dma.cur;
			if (chan->dma.free >= count)
				break;

			/*
			 * Not enough room at the tail: submit what is pending
			 * and restart from offset 0 once GET is non-zero.
			 */
			FIRE_RING(chan);
			do {
				get = READ_GET(chan, &prev_get, &cnt);
				if (unlikely(get < 0 && get != -EINVAL))
					return get;
				/*
				 * -EINVAL must be retried by the loop condition
				 * itself.  A `continue` inside a do/while jumps
				 * to the condition, and "get == 0" is false for
				 * -EINVAL, so the loop would exit with a
				 * negative get and dma.free would then be
				 * computed from an error code.
				 */
			} while (get <= 0);

			chan->dma.cur = 0;
			chan->dma.put = 0;
		}

		/* stay one dword short of GET */
		chan->dma.free = get - chan->dma.cur - 1;
	}

	return 0;
}
int int
nouveau_dma_wait(struct nouveau_channel *chan, int size) nouveau_dma_wait(struct nouveau_channel *chan, int slots, int size)
{ {
uint32_t prev_get = 0, cnt = 0; uint32_t prev_get = 0, cnt = 0;
int get; int get;
if (chan->dma.ib_max)
return nv50_dma_wait(chan, slots, size);
while (chan->dma.free < size) { while (chan->dma.free < size) {
get = READ_GET(chan, &prev_get, &cnt); get = READ_GET(chan, &prev_get, &cnt);
if (unlikely(get == -EBUSY)) if (unlikely(get == -EBUSY))
......
...@@ -31,6 +31,9 @@ ...@@ -31,6 +31,9 @@
#define NOUVEAU_DMA_DEBUG 0 #define NOUVEAU_DMA_DEBUG 0
#endif #endif
void nv50_dma_push(struct nouveau_channel *, struct nouveau_bo *,
int delta, int dwords);
/* /*
* There's a hw race condition where you can't jump to your PUT offset, * There's a hw race condition where you can't jump to your PUT offset,
* to avoid this we jump to offset + SKIPS and fill the difference with * to avoid this we jump to offset + SKIPS and fill the difference with
...@@ -96,13 +99,11 @@ enum { ...@@ -96,13 +99,11 @@ enum {
static __must_check inline int static __must_check inline int
RING_SPACE(struct nouveau_channel *chan, int size) RING_SPACE(struct nouveau_channel *chan, int size)
{ {
if (chan->dma.free < size) { int ret;
int ret;
ret = nouveau_dma_wait(chan, size); ret = nouveau_dma_wait(chan, 1, size);
if (ret) if (ret)
return ret; return ret;
}
chan->dma.free -= size; chan->dma.free -= size;
return 0; return 0;
...@@ -146,7 +147,13 @@ FIRE_RING(struct nouveau_channel *chan) ...@@ -146,7 +147,13 @@ FIRE_RING(struct nouveau_channel *chan)
return; return;
chan->accel_done = true; chan->accel_done = true;
WRITE_PUT(chan->dma.cur); if (chan->dma.ib_max) {
nv50_dma_push(chan, chan->pushbuf_bo, chan->dma.put << 2,
chan->dma.cur - chan->dma.put);
} else {
WRITE_PUT(chan->dma.cur);
}
chan->dma.put = chan->dma.cur; chan->dma.put = chan->dma.cur;
} }
......
...@@ -239,6 +239,11 @@ struct nouveau_channel { ...@@ -239,6 +239,11 @@ struct nouveau_channel {
int cur; int cur;
int put; int put;
/* access via pushbuf_bo */ /* access via pushbuf_bo */
int ib_base;
int ib_max;
int ib_free;
int ib_put;
} dma; } dma;
uint32_t sw_subchannel[8]; uint32_t sw_subchannel[8];
...@@ -848,7 +853,7 @@ nouveau_debugfs_channel_fini(struct nouveau_channel *chan) ...@@ -848,7 +853,7 @@ nouveau_debugfs_channel_fini(struct nouveau_channel *chan)
/* nouveau_dma.c */ /* nouveau_dma.c */
extern void nouveau_dma_pre_init(struct nouveau_channel *); extern void nouveau_dma_pre_init(struct nouveau_channel *);
extern int nouveau_dma_init(struct nouveau_channel *); extern int nouveau_dma_init(struct nouveau_channel *);
extern int nouveau_dma_wait(struct nouveau_channel *, int size); extern int nouveau_dma_wait(struct nouveau_channel *, int slots, int size);
/* nouveau_acpi.c */ /* nouveau_acpi.c */
#ifdef CONFIG_ACPI #ifdef CONFIG_ACPI
......
...@@ -707,7 +707,7 @@ nouveau_gem_ioctl_pushbuf_call(struct drm_device *dev, void *data, ...@@ -707,7 +707,7 @@ nouveau_gem_ioctl_pushbuf_call(struct drm_device *dev, void *data,
uint32_t retaddy; uint32_t retaddy;
if (chan->dma.free < 4 + NOUVEAU_DMA_SKIPS) { if (chan->dma.free < 4 + NOUVEAU_DMA_SKIPS) {
ret = nouveau_dma_wait(chan, 4 + NOUVEAU_DMA_SKIPS); ret = nouveau_dma_wait(chan, 0, 4 + NOUVEAU_DMA_SKIPS);
if (ret) { if (ret) {
NV_ERROR(dev, "jmp_space: %d\n", ret); NV_ERROR(dev, "jmp_space: %d\n", ret);
goto out; goto out;
...@@ -754,6 +754,15 @@ nouveau_gem_ioctl_pushbuf_call(struct drm_device *dev, void *data, ...@@ -754,6 +754,15 @@ nouveau_gem_ioctl_pushbuf_call(struct drm_device *dev, void *data,
} }
} }
if (chan->dma.ib_max) {
ret = nouveau_dma_wait(chan, 2, 6);
if (ret) {
NV_INFO(dev, "nv50cal_space: %d\n", ret);
goto out;
}
nv50_dma_push(chan, pbbo, req->offset, req->nr_dwords);
} else
if (PUSHBUF_CAL) { if (PUSHBUF_CAL) {
ret = RING_SPACE(chan, 2); ret = RING_SPACE(chan, 2);
if (ret) { if (ret) {
...@@ -792,6 +801,10 @@ out: ...@@ -792,6 +801,10 @@ out:
kfree(bo); kfree(bo);
out_next: out_next:
if (chan->dma.ib_max) {
req->suffix0 = 0x00000000;
req->suffix1 = 0x00000000;
} else
if (PUSHBUF_CAL) { if (PUSHBUF_CAL) {
req->suffix0 = 0x00020000; req->suffix0 = 0x00020000;
req->suffix1 = 0x00000000; req->suffix1 = 0x00000000;
......
...@@ -283,17 +283,17 @@ nv50_fifo_create_context(struct nouveau_channel *chan) ...@@ -283,17 +283,17 @@ nv50_fifo_create_context(struct nouveau_channel *chan)
dev_priv->engine.instmem.prepare_access(dev, true); dev_priv->engine.instmem.prepare_access(dev, true);
nv_wo32(dev, ramfc, 0x08/4, chan->pushbuf_base);
nv_wo32(dev, ramfc, 0x10/4, chan->pushbuf_base);
nv_wo32(dev, ramfc, 0x48/4, chan->pushbuf->instance >> 4); nv_wo32(dev, ramfc, 0x48/4, chan->pushbuf->instance >> 4);
nv_wo32(dev, ramfc, 0x80/4, (0xc << 24) | (chan->ramht->instance >> 4)); nv_wo32(dev, ramfc, 0x80/4, (0xc << 24) | (chan->ramht->instance >> 4));
nv_wo32(dev, ramfc, 0x3c/4, 0x00086078);
nv_wo32(dev, ramfc, 0x44/4, 0x2101ffff); nv_wo32(dev, ramfc, 0x44/4, 0x2101ffff);
nv_wo32(dev, ramfc, 0x60/4, 0x7fffffff); nv_wo32(dev, ramfc, 0x60/4, 0x7fffffff);
nv_wo32(dev, ramfc, 0x40/4, 0x00000000); nv_wo32(dev, ramfc, 0x40/4, 0x00000000);
nv_wo32(dev, ramfc, 0x7c/4, 0x30000001); nv_wo32(dev, ramfc, 0x7c/4, 0x30000001);
nv_wo32(dev, ramfc, 0x78/4, 0x00000000); nv_wo32(dev, ramfc, 0x78/4, 0x00000000);
nv_wo32(dev, ramfc, 0x4c/4, 0xffffffff); nv_wo32(dev, ramfc, 0x3c/4, 0x403f6078);
nv_wo32(dev, ramfc, 0x50/4, chan->pushbuf_base +
chan->dma.ib_base * 4);
nv_wo32(dev, ramfc, 0x54/4, drm_order(chan->dma.ib_max + 1) << 16);
if (!IS_G80) { if (!IS_G80) {
nv_wo32(dev, chan->ramin->gpuobj, 0, chan->id); nv_wo32(dev, chan->ramin->gpuobj, 0, chan->id);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment