These changes are the raw update to linux-4.4.6-rt14. Kernel sources

[kvmfornfv.git] / kernel / drivers / gpu / drm / nouveau / nvkm / engine / gr / ctxgf100.c
diff --git a/kernel/drivers/gpu/drm/nouveau/nvkm/engine/gr/ctxgf100.c b/kernel/drivers/gpu/drm/nouveau/nvkm/engine/gr/ctxgf100.c

index 57e2c5b..56f392d 100644 (file)
--- a/kernel/drivers/gpu/drm/nouveau/nvkm/engine/gr/ctxgf100.c
+++ b/kernel/drivers/gpu/drm/nouveau/nvkm/engine/gr/ctxgf100.c
@@ -23,7 +23,6 @@
   */
  #include "ctxgf100.h"
  
-#include <subdev/bar.h>
  #include <subdev/fb.h>
  #include <subdev/mc.h>
  #include <subdev/timer.h>
@@ -1005,6 +1004,7 @@ void
  gf100_grctx_mmio_item(struct gf100_grctx *info, u32 addr, u32 data,
                       int shift, int buffer)
  {
+       struct nvkm_device *device = info->gr->base.engine.subdev.device;
         if (info->data) {
                 if (shift >= 0) {
                         info->mmio->addr = addr;
@@ -1021,29 +1021,29 @@ gf100_grctx_mmio_item(struct gf100_grctx *info, u32 addr, u32 data,
                         return;
         }
  
-       nv_wr32(info->priv, addr, data);
+       nvkm_wr32(device, addr, data);
  }
  
  void
  gf100_grctx_generate_bundle(struct gf100_grctx *info)
  {
-       const struct gf100_grctx_oclass *impl = gf100_grctx_impl(info->priv);
+       const struct gf100_grctx_func *grctx = info->gr->func->grctx;
         const u32 access = NV_MEM_ACCESS_RW | NV_MEM_ACCESS_SYS;
         const int s = 8;
-       const int b = mmio_vram(info, impl->bundle_size, (1 << s), access);
+       const int b = mmio_vram(info, grctx->bundle_size, (1 << s), access);
         mmio_refn(info, 0x408004, 0x00000000, s, b);
-       mmio_wr32(info, 0x408008, 0x80000000 | (impl->bundle_size >> s));
+       mmio_wr32(info, 0x408008, 0x80000000 | (grctx->bundle_size >> s));
         mmio_refn(info, 0x418808, 0x00000000, s, b);
-       mmio_wr32(info, 0x41880c, 0x80000000 | (impl->bundle_size >> s));
+       mmio_wr32(info, 0x41880c, 0x80000000 | (grctx->bundle_size >> s));
  }
  
  void
  gf100_grctx_generate_pagepool(struct gf100_grctx *info)
  {
-       const struct gf100_grctx_oclass *impl = gf100_grctx_impl(info->priv);
+       const struct gf100_grctx_func *grctx = info->gr->func->grctx;
         const u32 access = NV_MEM_ACCESS_RW | NV_MEM_ACCESS_SYS;
         const int s = 8;
-       const int b = mmio_vram(info, impl->pagepool_size, (1 << s), access);
+       const int b = mmio_vram(info, grctx->pagepool_size, (1 << s), access);
         mmio_refn(info, 0x40800c, 0x00000000, s, b);
         mmio_wr32(info, 0x408010, 0x80000000);
         mmio_refn(info, 0x419004, 0x00000000, s, b);
@@ -1053,13 +1053,13 @@ gf100_grctx_generate_pagepool(struct gf100_grctx *info)
  void
  gf100_grctx_generate_attrib(struct gf100_grctx *info)
  {
-       struct gf100_gr_priv *priv = info->priv;
-       const struct gf100_grctx_oclass *impl = gf100_grctx_impl(priv);
-       const u32 attrib = impl->attrib_nr;
-       const u32   size = 0x20 * (impl->attrib_nr_max + impl->alpha_nr_max);
+       struct gf100_gr *gr = info->gr;
+       const struct gf100_grctx_func *grctx = gr->func->grctx;
+       const u32 attrib = grctx->attrib_nr;
+       const u32   size = 0x20 * (grctx->attrib_nr_max + grctx->alpha_nr_max);
         const u32 access = NV_MEM_ACCESS_RW;
         const int s = 12;
-       const int b = mmio_vram(info, size * priv->tpc_total, (1 << s), access);
+       const int b = mmio_vram(info, size * gr->tpc_total, (1 << s), access);
         int gpc, tpc;
         u32 bo = 0;
  
@@ -1067,91 +1067,95 @@ gf100_grctx_generate_attrib(struct gf100_grctx *info)
         mmio_refn(info, 0x419848, 0x10000000, s, b);
         mmio_wr32(info, 0x405830, (attrib << 16));
  
-       for (gpc = 0; gpc < priv->gpc_nr; gpc++) {
-               for (tpc = 0; tpc < priv->tpc_nr[gpc]; tpc++) {
+       for (gpc = 0; gpc < gr->gpc_nr; gpc++) {
+               for (tpc = 0; tpc < gr->tpc_nr[gpc]; tpc++) {
                         const u32 o = TPC_UNIT(gpc, tpc, 0x0520);
                         mmio_skip(info, o, (attrib << 16) | ++bo);
                         mmio_wr32(info, o, (attrib << 16) | --bo);
-                       bo += impl->attrib_nr_max;
+                       bo += grctx->attrib_nr_max;
                 }
         }
  }
  
  void
-gf100_grctx_generate_unkn(struct gf100_gr_priv *priv)
+gf100_grctx_generate_unkn(struct gf100_gr *gr)
  {
  }
  
  void
-gf100_grctx_generate_tpcid(struct gf100_gr_priv *priv)
+gf100_grctx_generate_tpcid(struct gf100_gr *gr)
  {
+       struct nvkm_device *device = gr->base.engine.subdev.device;
         int gpc, tpc, id;
  
         for (tpc = 0, id = 0; tpc < 4; tpc++) {
-               for (gpc = 0; gpc < priv->gpc_nr; gpc++) {
-                       if (tpc < priv->tpc_nr[gpc]) {
-                               nv_wr32(priv, TPC_UNIT(gpc, tpc, 0x698), id);
-                               nv_wr32(priv, TPC_UNIT(gpc, tpc, 0x4e8), id);
-                               nv_wr32(priv, GPC_UNIT(gpc, 0x0c10 + tpc * 4), id);
-                               nv_wr32(priv, TPC_UNIT(gpc, tpc, 0x088), id);
+               for (gpc = 0; gpc < gr->gpc_nr; gpc++) {
+                       if (tpc < gr->tpc_nr[gpc]) {
+                               nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x698), id);
+                               nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x4e8), id);
+                               nvkm_wr32(device, GPC_UNIT(gpc, 0x0c10 + tpc * 4), id);
+                               nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x088), id);
                                 id++;
                         }
  
-                       nv_wr32(priv, GPC_UNIT(gpc, 0x0c08), priv->tpc_nr[gpc]);
-                       nv_wr32(priv, GPC_UNIT(gpc, 0x0c8c), priv->tpc_nr[gpc]);
+                       nvkm_wr32(device, GPC_UNIT(gpc, 0x0c08), gr->tpc_nr[gpc]);
+                       nvkm_wr32(device, GPC_UNIT(gpc, 0x0c8c), gr->tpc_nr[gpc]);
                 }
         }
  }
  
  void
-gf100_grctx_generate_r406028(struct gf100_gr_priv *priv)
+gf100_grctx_generate_r406028(struct gf100_gr *gr)
  {
+       struct nvkm_device *device = gr->base.engine.subdev.device;
         u32 tmp[GPC_MAX / 8] = {}, i = 0;
-       for (i = 0; i < priv->gpc_nr; i++)
-               tmp[i / 8] |= priv->tpc_nr[i] << ((i % 8) * 4);
+       for (i = 0; i < gr->gpc_nr; i++)
+               tmp[i / 8] |= gr->tpc_nr[i] << ((i % 8) * 4);
         for (i = 0; i < 4; i++) {
-               nv_wr32(priv, 0x406028 + (i * 4), tmp[i]);
-               nv_wr32(priv, 0x405870 + (i * 4), tmp[i]);
+               nvkm_wr32(device, 0x406028 + (i * 4), tmp[i]);
+               nvkm_wr32(device, 0x405870 + (i * 4), tmp[i]);
         }
  }
  
  void
-gf100_grctx_generate_r4060a8(struct gf100_gr_priv *priv)
+gf100_grctx_generate_r4060a8(struct gf100_gr *gr)
  {
+       struct nvkm_device *device = gr->base.engine.subdev.device;
         u8  tpcnr[GPC_MAX], data[TPC_MAX];
         int gpc, tpc, i;
  
-       memcpy(tpcnr, priv->tpc_nr, sizeof(priv->tpc_nr));
+       memcpy(tpcnr, gr->tpc_nr, sizeof(gr->tpc_nr));
         memset(data, 0x1f, sizeof(data));
  
         gpc = -1;
-       for (tpc = 0; tpc < priv->tpc_total; tpc++) {
+       for (tpc = 0; tpc < gr->tpc_total; tpc++) {
                 do {
-                       gpc = (gpc + 1) % priv->gpc_nr;
+                       gpc = (gpc + 1) % gr->gpc_nr;
                 } while (!tpcnr[gpc]);
                 tpcnr[gpc]--;
                 data[tpc] = gpc;
         }
  
         for (i = 0; i < 4; i++)
-               nv_wr32(priv, 0x4060a8 + (i * 4), ((u32 *)data)[i]);
+               nvkm_wr32(device, 0x4060a8 + (i * 4), ((u32 *)data)[i]);
  }
  
  void
-gf100_grctx_generate_r418bb8(struct gf100_gr_priv *priv)
+gf100_grctx_generate_r418bb8(struct gf100_gr *gr)
  {
+       struct nvkm_device *device = gr->base.engine.subdev.device;
         u32 data[6] = {}, data2[2] = {};
         u8  tpcnr[GPC_MAX];
         u8  shift, ntpcv;
         int gpc, tpc, i;
  
         /* calculate first set of magics */
-       memcpy(tpcnr, priv->tpc_nr, sizeof(priv->tpc_nr));
+       memcpy(tpcnr, gr->tpc_nr, sizeof(gr->tpc_nr));
  
         gpc = -1;
-       for (tpc = 0; tpc < priv->tpc_total; tpc++) {
+       for (tpc = 0; tpc < gr->tpc_total; tpc++) {
                 do {
-                       gpc = (gpc + 1) % priv->gpc_nr;
+                       gpc = (gpc + 1) % gr->gpc_nr;
                 } while (!tpcnr[gpc]);
                 tpcnr[gpc]--;
  
@@ -1163,7 +1167,7 @@ gf100_grctx_generate_r418bb8(struct gf100_gr_priv *priv)
  
         /* and the second... */
         shift = 0;
-       ntpcv = priv->tpc_total;
+       ntpcv = gr->tpc_total;
         while (!(ntpcv & (1 << 4))) {
                 ntpcv <<= 1;
                 shift++;
@@ -1176,202 +1180,211 @@ gf100_grctx_generate_r418bb8(struct gf100_gr_priv *priv)
                 data2[1] |= ((1 << (i + 5)) % ntpcv) << ((i - 1) * 5);
  
         /* GPC_BROADCAST */
-       nv_wr32(priv, 0x418bb8, (priv->tpc_total << 8) |
-                                priv->magic_not_rop_nr);
+       nvkm_wr32(device, 0x418bb8, (gr->tpc_total << 8) |
+                                gr->magic_not_rop_nr);
         for (i = 0; i < 6; i++)
-               nv_wr32(priv, 0x418b08 + (i * 4), data[i]);
+               nvkm_wr32(device, 0x418b08 + (i * 4), data[i]);
  
         /* GPC_BROADCAST.TP_BROADCAST */
-       nv_wr32(priv, 0x419bd0, (priv->tpc_total << 8) |
-                                priv->magic_not_rop_nr | data2[0]);
-       nv_wr32(priv, 0x419be4, data2[1]);
+       nvkm_wr32(device, 0x419bd0, (gr->tpc_total << 8) |
+                                gr->magic_not_rop_nr | data2[0]);
+       nvkm_wr32(device, 0x419be4, data2[1]);
         for (i = 0; i < 6; i++)
-               nv_wr32(priv, 0x419b00 + (i * 4), data[i]);
+               nvkm_wr32(device, 0x419b00 + (i * 4), data[i]);
  
         /* UNK78xx */
-       nv_wr32(priv, 0x4078bc, (priv->tpc_total << 8) |
-                                priv->magic_not_rop_nr);
+       nvkm_wr32(device, 0x4078bc, (gr->tpc_total << 8) |
+                                gr->magic_not_rop_nr);
         for (i = 0; i < 6; i++)
-               nv_wr32(priv, 0x40780c + (i * 4), data[i]);
+               nvkm_wr32(device, 0x40780c + (i * 4), data[i]);
  }
  
  void
-gf100_grctx_generate_r406800(struct gf100_gr_priv *priv)
+gf100_grctx_generate_r406800(struct gf100_gr *gr)
  {
+       struct nvkm_device *device = gr->base.engine.subdev.device;
         u64 tpc_mask = 0, tpc_set = 0;
         u8  tpcnr[GPC_MAX];
         int gpc, tpc;
         int i, a, b;
  
-       memcpy(tpcnr, priv->tpc_nr, sizeof(priv->tpc_nr));
-       for (gpc = 0; gpc < priv->gpc_nr; gpc++)
-               tpc_mask |= ((1ULL << priv->tpc_nr[gpc]) - 1) << (gpc * 8);
+       memcpy(tpcnr, gr->tpc_nr, sizeof(gr->tpc_nr));
+       for (gpc = 0; gpc < gr->gpc_nr; gpc++)
+               tpc_mask |= ((1ULL << gr->tpc_nr[gpc]) - 1) << (gpc * 8);
  
         for (i = 0, gpc = -1, b = -1; i < 32; i++) {
-               a = (i * (priv->tpc_total - 1)) / 32;
+               a = (i * (gr->tpc_total - 1)) / 32;
                 if (a != b) {
                         b = a;
                         do {
-                               gpc = (gpc + 1) % priv->gpc_nr;
+                               gpc = (gpc + 1) % gr->gpc_nr;
                         } while (!tpcnr[gpc]);
-                       tpc = priv->tpc_nr[gpc] - tpcnr[gpc]--;
+                       tpc = gr->tpc_nr[gpc] - tpcnr[gpc]--;
  
                         tpc_set |= 1ULL << ((gpc * 8) + tpc);
                 }
  
-               nv_wr32(priv, 0x406800 + (i * 0x20), lower_32_bits(tpc_set));
-               nv_wr32(priv, 0x406c00 + (i * 0x20), lower_32_bits(tpc_set ^ tpc_mask));
-               if (priv->gpc_nr > 4) {
-                       nv_wr32(priv, 0x406804 + (i * 0x20), upper_32_bits(tpc_set));
-                       nv_wr32(priv, 0x406c04 + (i * 0x20), upper_32_bits(tpc_set ^ tpc_mask));
+               nvkm_wr32(device, 0x406800 + (i * 0x20), lower_32_bits(tpc_set));
+               nvkm_wr32(device, 0x406c00 + (i * 0x20), lower_32_bits(tpc_set ^ tpc_mask));
+               if (gr->gpc_nr > 4) {
+                       nvkm_wr32(device, 0x406804 + (i * 0x20), upper_32_bits(tpc_set));
+                       nvkm_wr32(device, 0x406c04 + (i * 0x20), upper_32_bits(tpc_set ^ tpc_mask));
                 }
         }
  }
  
  void
-gf100_grctx_generate_main(struct gf100_gr_priv *priv, struct gf100_grctx *info)
+gf100_grctx_generate_main(struct gf100_gr *gr, struct gf100_grctx *info)
  {
-       struct gf100_grctx_oclass *oclass = (void *)nv_engine(priv)->cclass;
-
-       nvkm_mc(priv)->unk260(nvkm_mc(priv), 0);
-
-       gf100_gr_mmio(priv, oclass->hub);
-       gf100_gr_mmio(priv, oclass->gpc);
-       gf100_gr_mmio(priv, oclass->zcull);
-       gf100_gr_mmio(priv, oclass->tpc);
-       gf100_gr_mmio(priv, oclass->ppc);
-
-       nv_wr32(priv, 0x404154, 0x00000000);
-
-       oclass->bundle(info);
-       oclass->pagepool(info);
-       oclass->attrib(info);
-       oclass->unkn(priv);
-
-       gf100_grctx_generate_tpcid(priv);
-       gf100_grctx_generate_r406028(priv);
-       gf100_grctx_generate_r4060a8(priv);
-       gf100_grctx_generate_r418bb8(priv);
-       gf100_grctx_generate_r406800(priv);
-
-       gf100_gr_icmd(priv, oclass->icmd);
-       nv_wr32(priv, 0x404154, 0x00000400);
-       gf100_gr_mthd(priv, oclass->mthd);
-       nvkm_mc(priv)->unk260(nvkm_mc(priv), 1);
+       struct nvkm_device *device = gr->base.engine.subdev.device;
+       const struct gf100_grctx_func *grctx = gr->func->grctx;
+
+       nvkm_mc_unk260(device->mc, 0);
+
+       gf100_gr_mmio(gr, grctx->hub);
+       gf100_gr_mmio(gr, grctx->gpc);
+       gf100_gr_mmio(gr, grctx->zcull);
+       gf100_gr_mmio(gr, grctx->tpc);
+       gf100_gr_mmio(gr, grctx->ppc);
+
+       nvkm_wr32(device, 0x404154, 0x00000000);
+
+       grctx->bundle(info);
+       grctx->pagepool(info);
+       grctx->attrib(info);
+       grctx->unkn(gr);
+
+       gf100_grctx_generate_tpcid(gr);
+       gf100_grctx_generate_r406028(gr);
+       gf100_grctx_generate_r4060a8(gr);
+       gf100_grctx_generate_r418bb8(gr);
+       gf100_grctx_generate_r406800(gr);
+
+       gf100_gr_icmd(gr, grctx->icmd);
+       nvkm_wr32(device, 0x404154, 0x00000400);
+       gf100_gr_mthd(gr, grctx->mthd);
+       nvkm_mc_unk260(device->mc, 1);
  }
  
  int
-gf100_grctx_generate(struct gf100_gr_priv *priv)
+gf100_grctx_generate(struct gf100_gr *gr)
  {
-       struct gf100_grctx_oclass *oclass = (void *)nv_engine(priv)->cclass;
-       struct nvkm_bar *bar = nvkm_bar(priv);
-       struct nvkm_gpuobj *chan;
+       const struct gf100_grctx_func *grctx = gr->func->grctx;
+       struct nvkm_subdev *subdev = &gr->base.engine.subdev;
+       struct nvkm_device *device = subdev->device;
+       struct nvkm_memory *chan;
         struct gf100_grctx info;
         int ret, i;
+       u64 addr;
  
         /* allocate memory to for a "channel", which we'll use to generate
          * the default context values
          */
-       ret = nvkm_gpuobj_new(nv_object(priv), NULL, 0x80000 + priv->size,
-                             0x1000, NVOBJ_FLAG_ZERO_ALLOC, &chan);
+       ret = nvkm_memory_new(device, NVKM_MEM_TARGET_INST, 0x80000 + gr->size,
+                             0x1000, true, &chan);
         if (ret) {
-               nv_error(priv, "failed to allocate channel memory, %d\n", ret);
+               nvkm_error(subdev, "failed to allocate chan memory, %d\n", ret);
                 return ret;
         }
  
+       addr = nvkm_memory_addr(chan);
+
         /* PGD pointer */
-       nv_wo32(chan, 0x0200, lower_32_bits(chan->addr + 0x1000));
-       nv_wo32(chan, 0x0204, upper_32_bits(chan->addr + 0x1000));
-       nv_wo32(chan, 0x0208, 0xffffffff);
-       nv_wo32(chan, 0x020c, 0x000000ff);
+       nvkm_kmap(chan);
+       nvkm_wo32(chan, 0x0200, lower_32_bits(addr + 0x1000));
+       nvkm_wo32(chan, 0x0204, upper_32_bits(addr + 0x1000));
+       nvkm_wo32(chan, 0x0208, 0xffffffff);
+       nvkm_wo32(chan, 0x020c, 0x000000ff);
  
         /* PGT[0] pointer */
-       nv_wo32(chan, 0x1000, 0x00000000);
-       nv_wo32(chan, 0x1004, 0x00000001 | (chan->addr + 0x2000) >> 8);
+       nvkm_wo32(chan, 0x1000, 0x00000000);
+       nvkm_wo32(chan, 0x1004, 0x00000001 | (addr + 0x2000) >> 8);
  
         /* identity-map the whole "channel" into its own vm */
-       for (i = 0; i < chan->size / 4096; i++) {
-               u64 addr = ((chan->addr + (i * 4096)) >> 8) | 1;
-               nv_wo32(chan, 0x2000 + (i * 8), lower_32_bits(addr));
-               nv_wo32(chan, 0x2004 + (i * 8), upper_32_bits(addr));
+       for (i = 0; i < nvkm_memory_size(chan) / 4096; i++) {
+               u64 addr = ((nvkm_memory_addr(chan) + (i * 4096)) >> 8) | 1;
+               nvkm_wo32(chan, 0x2000 + (i * 8), lower_32_bits(addr));
+               nvkm_wo32(chan, 0x2004 + (i * 8), upper_32_bits(addr));
         }
  
         /* context pointer (virt) */
-       nv_wo32(chan, 0x0210, 0x00080004);
-       nv_wo32(chan, 0x0214, 0x00000000);
+       nvkm_wo32(chan, 0x0210, 0x00080004);
+       nvkm_wo32(chan, 0x0214, 0x00000000);
+       nvkm_done(chan);
  
-       bar->flush(bar);
-
-       nv_wr32(priv, 0x100cb8, (chan->addr + 0x1000) >> 8);
-       nv_wr32(priv, 0x100cbc, 0x80000001);
-       nv_wait(priv, 0x100c80, 0x00008000, 0x00008000);
+       nvkm_wr32(device, 0x100cb8, (addr + 0x1000) >> 8);
+       nvkm_wr32(device, 0x100cbc, 0x80000001);
+       nvkm_msec(device, 2000,
+               if (nvkm_rd32(device, 0x100c80) & 0x00008000)
+                       break;
+       );
  
         /* setup default state for mmio list construction */
-       info.priv = priv;
-       info.data = priv->mmio_data;
-       info.mmio = priv->mmio_list;
+       info.gr = gr;
+       info.data = gr->mmio_data;
+       info.mmio = gr->mmio_list;
         info.addr = 0x2000 + (i * 8);
         info.buffer_nr = 0;
  
         /* make channel current */
-       if (priv->firmware) {
-               nv_wr32(priv, 0x409840, 0x00000030);
-               nv_wr32(priv, 0x409500, 0x80000000 | chan->addr >> 12);
-               nv_wr32(priv, 0x409504, 0x00000003);
-               if (!nv_wait(priv, 0x409800, 0x00000010, 0x00000010))
-                       nv_error(priv, "load_ctx timeout\n");
-
-               nv_wo32(chan, 0x8001c, 1);
-               nv_wo32(chan, 0x80020, 0);
-               nv_wo32(chan, 0x80028, 0);
-               nv_wo32(chan, 0x8002c, 0);
-               bar->flush(bar);
+       if (gr->firmware) {
+               nvkm_wr32(device, 0x409840, 0x00000030);
+               nvkm_wr32(device, 0x409500, 0x80000000 | addr >> 12);
+               nvkm_wr32(device, 0x409504, 0x00000003);
+               nvkm_msec(device, 2000,
+                       if (nvkm_rd32(device, 0x409800) & 0x00000010)
+                               break;
+               );
+
+               nvkm_kmap(chan);
+               nvkm_wo32(chan, 0x8001c, 1);
+               nvkm_wo32(chan, 0x80020, 0);
+               nvkm_wo32(chan, 0x80028, 0);
+               nvkm_wo32(chan, 0x8002c, 0);
+               nvkm_done(chan);
         } else {
-               nv_wr32(priv, 0x409840, 0x80000000);
-               nv_wr32(priv, 0x409500, 0x80000000 | chan->addr >> 12);
-               nv_wr32(priv, 0x409504, 0x00000001);
-               if (!nv_wait(priv, 0x409800, 0x80000000, 0x80000000))
-                       nv_error(priv, "HUB_SET_CHAN timeout\n");
+               nvkm_wr32(device, 0x409840, 0x80000000);
+               nvkm_wr32(device, 0x409500, 0x80000000 | addr >> 12);
+               nvkm_wr32(device, 0x409504, 0x00000001);
+               nvkm_msec(device, 2000,
+                       if (nvkm_rd32(device, 0x409800) & 0x80000000)
+                               break;
+               );
         }
  
-       oclass->main(priv, &info);
+       grctx->main(gr, &info);
  
         /* trigger a context unload by unsetting the "next channel valid" bit
          * and faking a context switch interrupt
          */
-       nv_mask(priv, 0x409b04, 0x80000000, 0x00000000);
-       nv_wr32(priv, 0x409000, 0x00000100);
-       if (!nv_wait(priv, 0x409b00, 0x80000000, 0x00000000)) {
-               nv_error(priv, "grctx template channel unload timeout\n");
+       nvkm_mask(device, 0x409b04, 0x80000000, 0x00000000);
+       nvkm_wr32(device, 0x409000, 0x00000100);
+       if (nvkm_msec(device, 2000,
+               if (!(nvkm_rd32(device, 0x409b00) & 0x80000000))
+                       break;
+       ) < 0) {
                 ret = -EBUSY;
                 goto done;
         }
  
-       priv->data = kmalloc(priv->size, GFP_KERNEL);
-       if (priv->data) {
-               for (i = 0; i < priv->size; i += 4)
-                       priv->data[i / 4] = nv_ro32(chan, 0x80000 + i);
+       gr->data = kmalloc(gr->size, GFP_KERNEL);
+       if (gr->data) {
+               nvkm_kmap(chan);
+               for (i = 0; i < gr->size; i += 4)
+                       gr->data[i / 4] = nvkm_ro32(chan, 0x80000 + i);
+               nvkm_done(chan);
                 ret = 0;
         } else {
                 ret = -ENOMEM;
         }
  
  done:
-       nvkm_gpuobj_ref(NULL, &chan);
+       nvkm_memory_del(&chan);
         return ret;
  }
  
-struct nvkm_oclass *
-gf100_grctx_oclass = &(struct gf100_grctx_oclass) {
-       .base.handle = NV_ENGCTX(GR, 0xc0),
-       .base.ofuncs = &(struct nvkm_ofuncs) {
-               .ctor = gf100_gr_context_ctor,
-               .dtor = gf100_gr_context_dtor,
-               .init = _nvkm_gr_context_init,
-               .fini = _nvkm_gr_context_fini,
-               .rd32 = _nvkm_gr_context_rd32,
-               .wr32 = _nvkm_gr_context_wr32,
-       },
+const struct gf100_grctx_func
+gf100_grctx = {
         .main  = gf100_grctx_generate_main,
         .unkn  = gf100_grctx_generate_unkn,
         .hub   = gf100_grctx_pack_hub,
@@ -1387,4 +1400,4 @@ gf100_grctx_oclass = &(struct gf100_grctx_oclass) {
         .attrib = gf100_grctx_generate_attrib,
         .attrib_nr_max = 0x324,
         .attrib_nr = 0x218,
-}.base;
+};