drivers/gpu/drm/nouveau/nouveau_object.c

   1 /*
   2  * Copyright (C) 2006 Ben Skeggs.
   3  *
   4  * All Rights Reserved.
   5  *
   6  * Permission is hereby granted, free of charge, to any person obtaining
   7  * a copy of this software and associated documentation files (the
   8  * "Software"), to deal in the Software without restriction, including
   9  * without limitation the rights to use, copy, modify, merge, publish,
  10  * distribute, sublicense, and/or sell copies of the Software, and to
  11  * permit persons to whom the Software is furnished to do so, subject to
  12  * the following conditions:
  13  *
  14  * The above copyright notice and this permission notice (including the
  15  * next paragraph) shall be included in all copies or substantial
  16  * portions of the Software.
  17  *
  18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  19  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
  21  * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
  22  * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
  23  * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
  24  * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  25  *
  26  */
  27
  28 /*
  29  * Authors:
  30  *   Ben Skeggs <darktama@iinet.net.au>
  31  */
  32
  33 #include "drmP.h"
  34 #include "drm.h"
  35 #include "nouveau_drv.h"
  36 #include "nouveau_drm.h"
  37 #include "nouveau_ramht.h"
  38 #include "nouveau_vm.h"
  39 #include "nv50_display.h"
  40
  41 struct nouveau_gpuobj_method {
  42         struct list_head head;
  43         u32 mthd;
  44         int (*exec)(struct nouveau_channel *, u32 class, u32 mthd, u32 data);
  45 };
  46
  47 struct nouveau_gpuobj_class {
  48         struct list_head head;
  49         struct list_head methods;
  50         u32 id;
  51         u32 engine;
  52 };
  53
  54 int
  55 nouveau_gpuobj_class_new(struct drm_device *dev, u32 class, u32 engine)
  56 {
  57         struct drm_nouveau_private *dev_priv = dev->dev_private;
  58         struct nouveau_gpuobj_class *oc;
  59
  60         oc = kzalloc(sizeof(*oc), GFP_KERNEL);
  61         if (!oc)
  62                 return -ENOMEM;
  63
  64         INIT_LIST_HEAD(&oc->methods);
  65         oc->id = class;
  66         oc->engine = engine;
  67         list_add(&oc->head, &dev_priv->classes);
  68         return 0;
  69 }
  70
  71 int
  72 nouveau_gpuobj_mthd_new(struct drm_device *dev, u32 class, u32 mthd,
  73                         int (*exec)(struct nouveau_channel *, u32, u32, u32))
  74 {
  75         struct drm_nouveau_private *dev_priv = dev->dev_private;
  76         struct nouveau_gpuobj_method *om;
  77         struct nouveau_gpuobj_class *oc;
  78
  79         list_for_each_entry(oc, &dev_priv->classes, head) {
  80                 if (oc->id == class)
  81                         goto found;
  82         }
  83
  84         return -EINVAL;
  85
  86 found:
  87         om = kzalloc(sizeof(*om), GFP_KERNEL);
  88         if (!om)
  89                 return -ENOMEM;
  90
  91         om->mthd = mthd;
  92         om->exec = exec;
  93         list_add(&om->head, &oc->methods);
  94         return 0;
  95 }
  96
  97 int
  98 nouveau_gpuobj_mthd_call(struct nouveau_channel *chan,
  99                          u32 class, u32 mthd, u32 data)
 100 {
 101         struct drm_nouveau_private *dev_priv = chan->dev->dev_private;
 102         struct nouveau_gpuobj_method *om;
 103         struct nouveau_gpuobj_class *oc;
 104
 105         list_for_each_entry(oc, &dev_priv->classes, head) {
 106                 if (oc->id != class)
 107                         continue;
 108
 109                 list_for_each_entry(om, &oc->methods, head) {
 110                         if (om->mthd == mthd)
 111                                 return om->exec(chan, class, mthd, data);
 112                 }
 113         }
 114
 115         return -ENOENT;
 116 }
 117
 118 int
 119 nouveau_gpuobj_mthd_call2(struct drm_device *dev, int chid,
 120                           u32 class, u32 mthd, u32 data)
 121 {
 122         struct drm_nouveau_private *dev_priv = dev->dev_private;
 123         struct nouveau_channel *chan = NULL;
 124         unsigned long flags;
 125         int ret = -EINVAL;
 126
 127         spin_lock_irqsave(&dev_priv->channels.lock, flags);
 128         if (chid > 0 && chid < dev_priv->engine.fifo.channels)
 129                 chan = dev_priv->channels.ptr[chid];
 130         if (chan)
 131                 ret = nouveau_gpuobj_mthd_call(chan, class, mthd, data);
 132         spin_unlock_irqrestore(&dev_priv->channels.lock, flags);
 133         return ret;
 134 }
 135
 136 /* NVidia uses context objects to drive drawing operations.
 137
 138    Context objects can be selected into 8 subchannels in the FIFO,
 139    and then used via DMA command buffers.
 140
 141    A context object is referenced by a user defined handle (CARD32). The HW
 142    looks up graphics objects in a hash table in the instance RAM.
 143
 144    An entry in the hash table consists of 2 CARD32. The first CARD32 contains
 145    the handle, the second one a bitfield, that contains the address of the
 146    object in instance RAM.
 147
 148    The format of the second CARD32 seems to be:
 149
 150    NV4 to NV30:
 151
 152    15: 0  instance_addr >> 4
 153    17:16  engine (here uses 1 = graphics)
 154    28:24  channel id (here uses 0)
 155    31     valid (use 1)
 156
 157    NV40:
 158
 159    15: 0  instance_addr >> 4   (maybe 19-0)
 160    21:20  engine (here uses 1 = graphics)
 161    I'm unsure about the other bits, but using 0 seems to work.
 162
 163    The key into the hash table depends on the object handle and channel id and
 164    is given as:
 165 */
 166
 167 int
 168 nouveau_gpuobj_new(struct drm_device *dev, struct nouveau_channel *chan,
 169                    uint32_t size, int align, uint32_t flags,
 170                    struct nouveau_gpuobj **gpuobj_ret)
 171 {
 172         struct drm_nouveau_private *dev_priv = dev->dev_private;
 173         struct nouveau_instmem_engine *instmem = &dev_priv->engine.instmem;
 174         struct nouveau_gpuobj *gpuobj;
 175         struct drm_mm_node *ramin = NULL;
 176         int ret, i;
 177
 178         NV_DEBUG(dev, "ch%d size=%u align=%d flags=0x%08x\n",
 179                  chan ? chan->id : -1, size, align, flags);
 180
 181         gpuobj = kzalloc(sizeof(*gpuobj), GFP_KERNEL);
 182         if (!gpuobj)
 183                 return -ENOMEM;
 184         NV_DEBUG(dev, "gpuobj %p\n", gpuobj);
 185         gpuobj->dev = dev;
 186         gpuobj->flags = flags;
 187         kref_init(&gpuobj->refcount);
 188         gpuobj->size = size;
 189
 190         spin_lock(&dev_priv->ramin_lock);
 191         list_add_tail(&gpuobj->list, &dev_priv->gpuobj_list);
 192         spin_unlock(&dev_priv->ramin_lock);
 193
 194         if (chan) {
 195                 ramin = drm_mm_search_free(&chan->ramin_heap, size, align, 0);
 196                 if (ramin)
 197                         ramin = drm_mm_get_block(ramin, size, align);
 198                 if (!ramin) {
 199                         nouveau_gpuobj_ref(NULL, &gpuobj);
 200                         return -ENOMEM;
 201                 }
 202
 203                 gpuobj->pinst = chan->ramin->pinst;
 204                 if (gpuobj->pinst != ~0)
 205                         gpuobj->pinst += ramin->start;
 206
 207                 gpuobj->cinst = ramin->start;
 208                 gpuobj->vinst = ramin->start + chan->ramin->vinst;
 209                 gpuobj->node  = ramin;
 210         } else {
 211                 ret = instmem->get(gpuobj, size, align);
 212                 if (ret) {
 213                         nouveau_gpuobj_ref(NULL, &gpuobj);
 214                         return ret;
 215                 }
 216
 217                 ret = -ENOSYS;
 218                 if (!(flags & NVOBJ_FLAG_DONT_MAP))
 219                         ret = instmem->map(gpuobj);
 220                 if (ret)
 221                         gpuobj->pinst = ~0;
 222
 223                 gpuobj->cinst = NVOBJ_CINST_GLOBAL;
 224         }
 225
 226         if (gpuobj->flags & NVOBJ_FLAG_ZERO_ALLOC) {
 227                 for (i = 0; i < gpuobj->size; i += 4)
 228                         nv_wo32(gpuobj, i, 0);
 229                 instmem->flush(dev);
 230         }
 231
 232
 233         *gpuobj_ret = gpuobj;
 234         return 0;
 235 }
 236
 237 int
 238 nouveau_gpuobj_init(struct drm_device *dev)
 239 {
 240         struct drm_nouveau_private *dev_priv = dev->dev_private;
 241
 242         NV_DEBUG(dev, "\n");
 243
 244         INIT_LIST_HEAD(&dev_priv->gpuobj_list);
 245         INIT_LIST_HEAD(&dev_priv->classes);
 246         spin_lock_init(&dev_priv->ramin_lock);
 247         dev_priv->ramin_base = ~0;
 248
 249         return 0;
 250 }
 251
 252 void
 253 nouveau_gpuobj_takedown(struct drm_device *dev)
 254 {
 255         struct drm_nouveau_private *dev_priv = dev->dev_private;
 256         struct nouveau_gpuobj_method *om, *tm;
 257         struct nouveau_gpuobj_class *oc, *tc;
 258
 259         NV_DEBUG(dev, "\n");
 260
 261         list_for_each_entry_safe(oc, tc, &dev_priv->classes, head) {
 262                 list_for_each_entry_safe(om, tm, &oc->methods, head) {
 263                         list_del(&om->head);
 264                         kfree(om);
 265                 }
 266                 list_del(&oc->head);
 267                 kfree(oc);
 268         }
 269
 270         BUG_ON(!list_empty(&dev_priv->gpuobj_list));
 271 }
 272
 273
 274 static void
 275 nouveau_gpuobj_del(struct kref *ref)
 276 {
 277         struct nouveau_gpuobj *gpuobj =
 278                 container_of(ref, struct nouveau_gpuobj, refcount);
 279         struct drm_device *dev = gpuobj->dev;
 280         struct drm_nouveau_private *dev_priv = dev->dev_private;
 281         struct nouveau_instmem_engine *instmem = &dev_priv->engine.instmem;
 282         int i;
 283
 284         NV_DEBUG(dev, "gpuobj %p\n", gpuobj);
 285
 286         if (gpuobj->node && (gpuobj->flags & NVOBJ_FLAG_ZERO_FREE)) {
 287                 for (i = 0; i < gpuobj->size; i += 4)
 288                         nv_wo32(gpuobj, i, 0);
 289                 instmem->flush(dev);
 290         }
 291
 292         if (gpuobj->dtor)
 293                 gpuobj->dtor(dev, gpuobj);
 294
 295         if (gpuobj->cinst == NVOBJ_CINST_GLOBAL) {
 296                 if (gpuobj->node) {
 297                         instmem->unmap(gpuobj);
 298                         instmem->put(gpuobj);
 299                 }
 300         } else {
 301                 if (gpuobj->node) {
 302                         spin_lock(&dev_priv->ramin_lock);
 303                         drm_mm_put_block(gpuobj->node);
 304                         spin_unlock(&dev_priv->ramin_lock);
 305                 }
 306         }
 307
 308         spin_lock(&dev_priv->ramin_lock);
 309         list_del(&gpuobj->list);
 310         spin_unlock(&dev_priv->ramin_lock);
 311
 312         kfree(gpuobj);
 313 }
 314
 315 void
 316 nouveau_gpuobj_ref(struct nouveau_gpuobj *ref, struct nouveau_gpuobj **ptr)
 317 {
 318         if (ref)
 319                 kref_get(&ref->refcount);
 320
 321         if (*ptr)
 322                 kref_put(&(*ptr)->refcount, nouveau_gpuobj_del);
 323
 324         *ptr = ref;
 325 }
 326
 327 int
 328 nouveau_gpuobj_new_fake(struct drm_device *dev, u32 pinst, u64 vinst,
 329                         u32 size, u32 flags, struct nouveau_gpuobj **pgpuobj)
 330 {
 331         struct drm_nouveau_private *dev_priv = dev->dev_private;
 332         struct nouveau_gpuobj *gpuobj = NULL;
 333         int i;
 334
 335         NV_DEBUG(dev,
 336                  "pinst=0x%08x vinst=0x%010llx size=0x%08x flags=0x%08x\n",
 337                  pinst, vinst, size, flags);
 338
 339         gpuobj = kzalloc(sizeof(*gpuobj), GFP_KERNEL);
 340         if (!gpuobj)
 341                 return -ENOMEM;
 342         NV_DEBUG(dev, "gpuobj %p\n", gpuobj);
 343         gpuobj->dev = dev;
 344         gpuobj->flags = flags;
 345         kref_init(&gpuobj->refcount);
 346         gpuobj->size  = size;
 347         gpuobj->pinst = pinst;
 348         gpuobj->cinst = NVOBJ_CINST_GLOBAL;
 349         gpuobj->vinst = vinst;
 350
 351         if (gpuobj->flags & NVOBJ_FLAG_ZERO_ALLOC) {
 352                 for (i = 0; i < gpuobj->size; i += 4)
 353                         nv_wo32(gpuobj, i, 0);
 354                 dev_priv->engine.instmem.flush(dev);
 355         }
 356
 357         spin_lock(&dev_priv->ramin_lock);
 358         list_add_tail(&gpuobj->list, &dev_priv->gpuobj_list);
 359         spin_unlock(&dev_priv->ramin_lock);
 360         *pgpuobj = gpuobj;
 361         return 0;
 362 }
 363
 364 /*
 365    DMA objects are used to reference a piece of memory in the
 366    framebuffer, PCI or AGP address space. Each object is 16 bytes big
 367    and looks as follows:
 368
 369    entry[0]
 370    11:0  class (seems like I can always use 0 here)
 371    12    page table present?
 372    13    page entry linear?
 373    15:14 access: 0 rw, 1 ro, 2 wo
 374    17:16 target: 0 NV memory, 1 NV memory tiled, 2 PCI, 3 AGP
 375    31:20 dma adjust (bits 0-11 of the address)
 376    entry[1]
 377    dma limit (size of transfer)
 378    entry[X]
 379    1     0 readonly, 1 readwrite
 380    31:12 dma frame address of the page (bits 12-31 of the address)
 381    entry[N]
 382    page table terminator, same value as the first pte, as does nvidia
 383    rivatv uses 0xffffffff
 384
 385    Non linear page tables need a list of frame addresses afterwards,
 386    the rivatv project has some info on this.
 387
 388    The method below creates a DMA object in instance RAM and returns a handle
 389    to it that can be used to set up context objects.
 390 */
 391
 392 void
 393 nv50_gpuobj_dma_init(struct nouveau_gpuobj *obj, u32 offset, int class,
 394                      u64 base, u64 size, int target, int access,
 395                      u32 type, u32 comp)
 396 {
 397         struct drm_nouveau_private *dev_priv = obj->dev->dev_private;
 398         struct nouveau_instmem_engine *pinstmem = &dev_priv->engine.instmem;
 399         u32 flags0;
 400
 401         flags0  = (comp << 29) | (type << 22) | class;
 402         flags0 |= 0x00100000;
 403
 404         switch (access) {
 405         case NV_MEM_ACCESS_RO: flags0 |= 0x00040000; break;
 406         case NV_MEM_ACCESS_RW:
 407         case NV_MEM_ACCESS_WO: flags0 |= 0x00080000; break;
 408         default:
 409                 break;
 410         }
 411
 412         switch (target) {
 413         case NV_MEM_TARGET_VRAM:
 414                 flags0 |= 0x00010000;
 415                 break;
 416         case NV_MEM_TARGET_PCI:
 417                 flags0 |= 0x00020000;
 418                 break;
 419         case NV_MEM_TARGET_PCI_NOSNOOP:
 420                 flags0 |= 0x00030000;
 421                 break;
 422         case NV_MEM_TARGET_GART:
 423                 base += dev_priv->gart_info.aper_base;
 424         default:
 425                 flags0 &= ~0x00100000;
 426                 break;
 427         }
 428
 429         /* convert to base + limit */
 430         size = (base + size) - 1;
 431
 432         nv_wo32(obj, offset + 0x00, flags0);
 433         nv_wo32(obj, offset + 0x04, lower_32_bits(size));
 434         nv_wo32(obj, offset + 0x08, lower_32_bits(base));
 435         nv_wo32(obj, offset + 0x0c, upper_32_bits(size) << 24 |
 436                                     upper_32_bits(base));
 437         nv_wo32(obj, offset + 0x10, 0x00000000);
 438         nv_wo32(obj, offset + 0x14, 0x00000000);
 439
 440         pinstmem->flush(obj->dev);
 441 }
 442
 443 int
 444 nv50_gpuobj_dma_new(struct nouveau_channel *chan, int class, u64 base, u64 size,
 445                     int target, int access, u32 type, u32 comp,
 446                     struct nouveau_gpuobj **pobj)
 447 {
 448         struct drm_device *dev = chan->dev;
 449         int ret;
 450
 451         ret = nouveau_gpuobj_new(dev, chan, 24, 16, NVOBJ_FLAG_ZERO_FREE, pobj);
 452         if (ret)
 453                 return ret;
 454
 455         nv50_gpuobj_dma_init(*pobj, 0, class, base, size, target,
 456                              access, type, comp);
 457         return 0;
 458 }
 459
 460 int
 461 nouveau_gpuobj_dma_new(struct nouveau_channel *chan, int class, u64 base,
 462                        u64 size, int access, int target,
 463                        struct nouveau_gpuobj **pobj)
 464 {
 465         struct drm_nouveau_private *dev_priv = chan->dev->dev_private;
 466         struct drm_device *dev = chan->dev;
 467         struct nouveau_gpuobj *obj;
 468         u32 flags0, flags2;
 469         int ret;
 470
 471         if (dev_priv->card_type >= NV_50) {
 472                 u32 comp = (target == NV_MEM_TARGET_VM) ? NV_MEM_COMP_VM : 0;
 473                 u32 type = (target == NV_MEM_TARGET_VM) ? NV_MEM_TYPE_VM : 0;
 474
 475                 return nv50_gpuobj_dma_new(chan, class, base, size,
 476                                            target, access, type, comp, pobj);
 477         }
 478
 479         if (target == NV_MEM_TARGET_GART) {
 480                 struct nouveau_gpuobj *gart = dev_priv->gart_info.sg_ctxdma;
 481
 482                 if (dev_priv->gart_info.type == NOUVEAU_GART_PDMA) {
 483                         if (base == 0) {
 484                                 nouveau_gpuobj_ref(gart, pobj);
 485                                 return 0;
 486                         }
 487
 488                         base   = nouveau_sgdma_get_physical(dev, base);
 489                         target = NV_MEM_TARGET_PCI;
 490                 } else {
 491                         base += dev_priv->gart_info.aper_base;
 492                         if (dev_priv->gart_info.type == NOUVEAU_GART_AGP)
 493                                 target = NV_MEM_TARGET_PCI_NOSNOOP;
 494                         else
 495                                 target = NV_MEM_TARGET_PCI;
 496                 }
 497         }
 498
 499         flags0  = class;
 500         flags0 |= 0x00003000; /* PT present, PT linear */
 501         flags2  = 0;
 502
 503         switch (target) {
 504         case NV_MEM_TARGET_PCI:
 505                 flags0 |= 0x00020000;
 506                 break;
 507         case NV_MEM_TARGET_PCI_NOSNOOP:
 508                 flags0 |= 0x00030000;
 509                 break;
 510         default:
 511                 break;
 512         }
 513
 514         switch (access) {
 515         case NV_MEM_ACCESS_RO:
 516                 flags0 |= 0x00004000;
 517                 break;
 518         case NV_MEM_ACCESS_WO:
 519                 flags0 |= 0x00008000;
 520         default:
 521                 flags2 |= 0x00000002;
 522                 break;
 523         }
 524
 525         flags0 |= (base & 0x00000fff) << 20;
 526         flags2 |= (base & 0xfffff000);
 527
 528         ret = nouveau_gpuobj_new(dev, chan, 16, 16, NVOBJ_FLAG_ZERO_FREE, &obj);
 529         if (ret)
 530                 return ret;
 531
 532         nv_wo32(obj, 0x00, flags0);
 533         nv_wo32(obj, 0x04, size - 1);
 534         nv_wo32(obj, 0x08, flags2);
 535         nv_wo32(obj, 0x0c, flags2);
 536
 537         obj->engine = NVOBJ_ENGINE_SW;
 538         obj->class  = class;
 539         *pobj = obj;
 540         return 0;
 541 }
 542
 543 /* Context objects in the instance RAM have the following structure.
 544  * On NV40 they are 32 byte long, on NV30 and smaller 16 bytes.
 545
 546    NV4 - NV30:
 547
 548    entry[0]
 549    11:0 class
 550    12   chroma key enable
 551    13   user clip enable
 552    14   swizzle enable
 553    17:15 patch config:
 554        scrcopy_and, rop_and, blend_and, scrcopy, srccopy_pre, blend_pre
 555    18   synchronize enable
 556    19   endian: 1 big, 0 little
 557    21:20 dither mode
 558    23    single step enable
 559    24    patch status: 0 invalid, 1 valid
 560    25    context_surface 0: 1 valid
 561    26    context surface 1: 1 valid
 562    27    context pattern: 1 valid
 563    28    context rop: 1 valid
 564    29,30 context beta, beta4
 565    entry[1]
 566    7:0   mono format
 567    15:8  color format
 568    31:16 notify instance address
 569    entry[2]
 570    15:0  dma 0 instance address
 571    31:16 dma 1 instance address
 572    entry[3]
 573    dma method traps
 574
 575    NV40:
 576    No idea what the exact format is. Here's what can be deducted:
 577
 578    entry[0]:
 579    11:0  class  (maybe uses more bits here?)
 580    17    user clip enable
 581    21:19 patch config
 582    25    patch status valid ?
 583    entry[1]:
 584    15:0  DMA notifier  (maybe 20:0)
 585    entry[2]:
 586    15:0  DMA 0 instance (maybe 20:0)
 587    24    big endian
 588    entry[3]:
 589    15:0  DMA 1 instance (maybe 20:0)
 590    entry[4]:
 591    entry[5]:
 592    set to 0?
 593 */
 594 static int
 595 nouveau_gpuobj_sw_new(struct nouveau_channel *chan, u32 handle, u16 class)
 596 {
 597         struct drm_nouveau_private *dev_priv = chan->dev->dev_private;
 598         struct nouveau_gpuobj *gpuobj;
 599         int ret;
 600
 601         gpuobj = kzalloc(sizeof(*gpuobj), GFP_KERNEL);
 602         if (!gpuobj)
 603                 return -ENOMEM;
 604         gpuobj->dev = chan->dev;
 605         gpuobj->engine = NVOBJ_ENGINE_SW;
 606         gpuobj->class = class;
 607         kref_init(&gpuobj->refcount);
 608         gpuobj->cinst = 0x40;
 609
 610         spin_lock(&dev_priv->ramin_lock);
 611         list_add_tail(&gpuobj->list, &dev_priv->gpuobj_list);
 612         spin_unlock(&dev_priv->ramin_lock);
 613
 614         ret = nouveau_ramht_insert(chan, handle, gpuobj);
 615         nouveau_gpuobj_ref(NULL, &gpuobj);
 616         return ret;
 617 }
 618
 619 int
 620 nouveau_gpuobj_gr_new(struct nouveau_channel *chan, u32 handle, int class)
 621 {
 622         struct drm_nouveau_private *dev_priv = chan->dev->dev_private;
 623         struct nouveau_pgraph_engine *pgraph = &dev_priv->engine.graph;
 624         struct drm_device *dev = chan->dev;
 625         struct nouveau_gpuobj_class *oc;
 626         int ret;
 627
 628         NV_DEBUG(dev, "ch%d class=0x%04x\n", chan->id, class);
 629
 630         list_for_each_entry(oc, &dev_priv->classes, head) {
 631                 if (oc->id == class)
 632                         goto found;
 633         }
 634
 635         NV_ERROR(dev, "illegal object class: 0x%x\n", class);
 636         return -EINVAL;
 637
 638 found:
 639         switch (oc->engine) {
 640         case NVOBJ_ENGINE_SW:
 641                 return nouveau_gpuobj_sw_new(chan, handle, class);
 642         case NVOBJ_ENGINE_GR:
 643                 if ((dev_priv->card_type >= NV_20 && !chan->ramin_grctx) ||
 644                     (dev_priv->card_type  < NV_20 && !chan->pgraph_ctx)) {
 645                         ret = pgraph->create_context(chan);
 646                         if (ret)
 647                                 return ret;
 648                 }
 649
 650                 return pgraph->object_new(chan, handle, class);
 651         }
 652
 653         if (!chan->engctx[oc->engine]) {
 654                 ret = dev_priv->eng[oc->engine]->context_new(chan, oc->engine);
 655                 if (ret)
 656                         return ret;
 657         }
 658
 659         return dev_priv->eng[oc->engine]->object_new(chan, oc->engine, handle, class);
 660 }
 661
 662 static int
 663 nouveau_gpuobj_channel_init_pramin(struct nouveau_channel *chan)
 664 {
 665         struct drm_device *dev = chan->dev;
 666         struct drm_nouveau_private *dev_priv = dev->dev_private;
 667         uint32_t size;
 668         uint32_t base;
 669         int ret;
 670
 671         NV_DEBUG(dev, "ch%d\n", chan->id);
 672
 673         /* Base amount for object storage (4KiB enough?) */
 674         size = 0x2000;
 675         base = 0;
 676
 677         /* PGRAPH context */
 678         size += dev_priv->engine.graph.grctx_size;
 679
 680         if (dev_priv->card_type == NV_50) {
 681                 /* Various fixed table thingos */
 682                 size += 0x1400; /* mostly unknown stuff */
 683                 size += 0x4000; /* vm pd */
 684                 base  = 0x6000;
 685                 /* RAMHT, not sure about setting size yet, 32KiB to be safe */
 686                 size += 0x8000;
 687                 /* RAMFC */
 688                 size += 0x1000;
 689         }
 690
 691         ret = nouveau_gpuobj_new(dev, NULL, size, 0x1000, 0, &chan->ramin);
 692         if (ret) {
 693                 NV_ERROR(dev, "Error allocating channel PRAMIN: %d\n", ret);
 694                 return ret;
 695         }
 696
 697         ret = drm_mm_init(&chan->ramin_heap, base, size);
 698         if (ret) {
 699                 NV_ERROR(dev, "Error creating PRAMIN heap: %d\n", ret);
 700                 nouveau_gpuobj_ref(NULL, &chan->ramin);
 701                 return ret;
 702         }
 703
 704         return 0;
 705 }
 706
 707 int
 708 nouveau_gpuobj_channel_init(struct nouveau_channel *chan,
 709                             uint32_t vram_h, uint32_t tt_h)
 710 {
 711         struct drm_device *dev = chan->dev;
 712         struct drm_nouveau_private *dev_priv = dev->dev_private;
 713         struct nouveau_gpuobj *vram = NULL, *tt = NULL;
 714         int ret, i;
 715
 716         NV_DEBUG(dev, "ch%d vram=0x%08x tt=0x%08x\n", chan->id, vram_h, tt_h);
 717
 718         if (dev_priv->card_type == NV_C0) {
 719                 struct nouveau_vm *vm = dev_priv->chan_vm;
 720                 struct nouveau_vm_pgd *vpgd;
 721
 722                 ret = nouveau_gpuobj_new(dev, NULL, 4096, 0x1000, 0,
 723                                          &chan->ramin);
 724                 if (ret)
 725                         return ret;
 726
 727                 nouveau_vm_ref(vm, &chan->vm, NULL);
 728
 729                 vpgd = list_first_entry(&vm->pgd_list, struct nouveau_vm_pgd, head);
 730                 nv_wo32(chan->ramin, 0x0200, lower_32_bits(vpgd->obj->vinst));
 731                 nv_wo32(chan->ramin, 0x0204, upper_32_bits(vpgd->obj->vinst));
 732                 nv_wo32(chan->ramin, 0x0208, 0xffffffff);
 733                 nv_wo32(chan->ramin, 0x020c, 0x000000ff);
 734                 return 0;
 735         }
 736
 737         /* Allocate a chunk of memory for per-channel object storage */
 738         ret = nouveau_gpuobj_channel_init_pramin(chan);
 739         if (ret) {
 740                 NV_ERROR(dev, "init pramin\n");
 741                 return ret;
 742         }
 743
 744         /* NV50 VM
 745          *  - Allocate per-channel page-directory
 746          *  - Link with shared channel VM
 747          */
 748         if (dev_priv->chan_vm) {
 749                 u32 pgd_offs = (dev_priv->chipset == 0x50) ? 0x1400 : 0x0200;
 750                 u64 vm_vinst = chan->ramin->vinst + pgd_offs;
 751                 u32 vm_pinst = chan->ramin->pinst;
 752
 753                 if (vm_pinst != ~0)
 754                         vm_pinst += pgd_offs;
 755
 756                 ret = nouveau_gpuobj_new_fake(dev, vm_pinst, vm_vinst, 0x4000,
 757                                               0, &chan->vm_pd);
 758                 if (ret)
 759                         return ret;
 760
 761                 nouveau_vm_ref(dev_priv->chan_vm, &chan->vm, chan->vm_pd);
 762         }
 763
 764         /* RAMHT */
 765         if (dev_priv->card_type < NV_50) {
 766                 nouveau_ramht_ref(dev_priv->ramht, &chan->ramht, NULL);
 767         } else {
 768                 struct nouveau_gpuobj *ramht = NULL;
 769
 770                 ret = nouveau_gpuobj_new(dev, chan, 0x8000, 16,
 771                                          NVOBJ_FLAG_ZERO_ALLOC, &ramht);
 772                 if (ret)
 773                         return ret;
 774
 775                 ret = nouveau_ramht_new(dev, ramht, &chan->ramht);
 776                 nouveau_gpuobj_ref(NULL, &ramht);
 777                 if (ret)
 778                         return ret;
 779
 780                 /* dma objects for display sync channel semaphore blocks */
 781                 for (i = 0; i < 2; i++) {
 782                         struct nouveau_gpuobj *sem = NULL;
 783                         struct nv50_display_crtc *dispc =
 784                                 &nv50_display(dev)->crtc[i];
 785                         u64 offset = dispc->sem.bo->bo.mem.start << PAGE_SHIFT;
 786
 787                         ret = nouveau_gpuobj_dma_new(chan, 0x3d, offset, 0xfff,
 788                                                      NV_MEM_ACCESS_RW,
 789                                                      NV_MEM_TARGET_VRAM, &sem);
 790                         if (ret)
 791                                 return ret;
 792
 793                         ret = nouveau_ramht_insert(chan, NvEvoSema0 + i, sem);
 794                         nouveau_gpuobj_ref(NULL, &sem);
 795                         if (ret)
 796                                 return ret;
 797                 }
 798         }
 799
 800         /* VRAM ctxdma */
 801         if (dev_priv->card_type >= NV_50) {
 802                 ret = nouveau_gpuobj_dma_new(chan, NV_CLASS_DMA_IN_MEMORY,
 803                                              0, (1ULL << 40), NV_MEM_ACCESS_RW,
 804                                              NV_MEM_TARGET_VM, &vram);
 805                 if (ret) {
 806                         NV_ERROR(dev, "Error creating VRAM ctxdma: %d\n", ret);
 807                         return ret;
 808                 }
 809         } else {
 810                 ret = nouveau_gpuobj_dma_new(chan, NV_CLASS_DMA_IN_MEMORY,
 811                                              0, dev_priv->fb_available_size,
 812                                              NV_MEM_ACCESS_RW,
 813                                              NV_MEM_TARGET_VRAM, &vram);
 814                 if (ret) {
 815                         NV_ERROR(dev, "Error creating VRAM ctxdma: %d\n", ret);
 816                         return ret;
 817                 }
 818         }
 819
 820         ret = nouveau_ramht_insert(chan, vram_h, vram);
 821         nouveau_gpuobj_ref(NULL, &vram);
 822         if (ret) {
 823                 NV_ERROR(dev, "Error adding VRAM ctxdma to RAMHT: %d\n", ret);
 824                 return ret;
 825         }
 826
 827         /* TT memory ctxdma */
 828         if (dev_priv->card_type >= NV_50) {
 829                 ret = nouveau_gpuobj_dma_new(chan, NV_CLASS_DMA_IN_MEMORY,
 830                                              0, (1ULL << 40), NV_MEM_ACCESS_RW,
 831                                              NV_MEM_TARGET_VM, &tt);
 832         } else {
 833                 ret = nouveau_gpuobj_dma_new(chan, NV_CLASS_DMA_IN_MEMORY,
 834                                              0, dev_priv->gart_info.aper_size,
 835                                              NV_MEM_ACCESS_RW,
 836                                              NV_MEM_TARGET_GART, &tt);
 837         }
 838
 839         if (ret) {
 840                 NV_ERROR(dev, "Error creating TT ctxdma: %d\n", ret);
 841                 return ret;
 842         }
 843
 844         ret = nouveau_ramht_insert(chan, tt_h, tt);
 845         nouveau_gpuobj_ref(NULL, &tt);
 846         if (ret) {
 847                 NV_ERROR(dev, "Error adding TT ctxdma to RAMHT: %d\n", ret);
 848                 return ret;
 849         }
 850
 851         return 0;
 852 }
 853
 854 void
 855 nouveau_gpuobj_channel_takedown(struct nouveau_channel *chan)
 856 {
 857         struct drm_device *dev = chan->dev;
 858
 859         NV_DEBUG(dev, "ch%d\n", chan->id);
 860
 861         nouveau_ramht_ref(NULL, &chan->ramht, chan);
 862
 863         nouveau_vm_ref(NULL, &chan->vm, chan->vm_pd);
 864         nouveau_gpuobj_ref(NULL, &chan->vm_pd);
 865
 866         if (drm_mm_initialized(&chan->ramin_heap))
 867                 drm_mm_takedown(&chan->ramin_heap);
 868         nouveau_gpuobj_ref(NULL, &chan->ramin);
 869 }
 870
 871 int
 872 nouveau_gpuobj_suspend(struct drm_device *dev)
 873 {
 874         struct drm_nouveau_private *dev_priv = dev->dev_private;
 875         struct nouveau_gpuobj *gpuobj;
 876         int i;
 877
 878         list_for_each_entry(gpuobj, &dev_priv->gpuobj_list, list) {
 879                 if (gpuobj->cinst != NVOBJ_CINST_GLOBAL)
 880                         continue;
 881
 882                 gpuobj->suspend = vmalloc(gpuobj->size);
 883                 if (!gpuobj->suspend) {
 884                         nouveau_gpuobj_resume(dev);
 885                         return -ENOMEM;
 886                 }
 887
 888                 for (i = 0; i < gpuobj->size; i += 4)
 889                         gpuobj->suspend[i/4] = nv_ro32(gpuobj, i);
 890         }
 891
 892         return 0;
 893 }
 894
 895 void
 896 nouveau_gpuobj_resume(struct drm_device *dev)
 897 {
 898         struct drm_nouveau_private *dev_priv = dev->dev_private;
 899         struct nouveau_gpuobj *gpuobj;
 900         int i;
 901
 902         list_for_each_entry(gpuobj, &dev_priv->gpuobj_list, list) {
 903                 if (!gpuobj->suspend)
 904                         continue;
 905
 906                 for (i = 0; i < gpuobj->size; i += 4)
 907                         nv_wo32(gpuobj, i, gpuobj->suspend[i/4]);
 908
 909                 vfree(gpuobj->suspend);
 910                 gpuobj->suspend = NULL;
 911         }
 912
 913         dev_priv->engine.instmem.flush(dev);
 914 }
 915
 916 int nouveau_ioctl_grobj_alloc(struct drm_device *dev, void *data,
 917                               struct drm_file *file_priv)
 918 {
 919         struct drm_nouveau_grobj_alloc *init = data;
 920         struct nouveau_channel *chan;
 921         int ret;
 922
 923         if (init->handle == ~0)
 924                 return -EINVAL;
 925
 926         chan = nouveau_channel_get(dev, file_priv, init->channel);
 927         if (IS_ERR(chan))
 928                 return PTR_ERR(chan);
 929
 930         if (nouveau_ramht_find(chan, init->handle)) {
 931                 ret = -EEXIST;
 932                 goto out;
 933         }
 934
 935         ret = nouveau_gpuobj_gr_new(chan, init->handle, init->class);
 936         if (ret) {
 937                 NV_ERROR(dev, "Error creating object: %d (%d/0x%08x)\n",
 938                          ret, init->channel, init->handle);
 939         }
 940
 941 out:
 942         nouveau_channel_put(&chan);
 943         return ret;
 944 }
 945
 946 int nouveau_ioctl_gpuobj_free(struct drm_device *dev, void *data,
 947                               struct drm_file *file_priv)
 948 {
 949         struct drm_nouveau_gpuobj_free *objfree = data;
 950         struct nouveau_channel *chan;
 951         int ret;
 952
 953         chan = nouveau_channel_get(dev, file_priv, objfree->channel);
 954         if (IS_ERR(chan))
 955                 return PTR_ERR(chan);
 956
 957         /* Synchronize with the user channel */
 958         nouveau_channel_idle(chan);
 959
 960         ret = nouveau_ramht_remove(chan, objfree->handle);
 961         nouveau_channel_put(&chan);
 962         return ret;
 963 }
 964
 965 u32
 966 nv_ro32(struct nouveau_gpuobj *gpuobj, u32 offset)
 967 {
 968         struct drm_nouveau_private *dev_priv = gpuobj->dev->dev_private;
 969         struct drm_device *dev = gpuobj->dev;
 970         unsigned long flags;
 971
 972         if (gpuobj->pinst == ~0 || !dev_priv->ramin_available) {
 973                 u64  ptr = gpuobj->vinst + offset;
 974                 u32 base = ptr >> 16;
 975                 u32  val;
 976
 977                 spin_lock_irqsave(&dev_priv->vm_lock, flags);
 978                 if (dev_priv->ramin_base != base) {
 979                         dev_priv->ramin_base = base;
 980                         nv_wr32(dev, 0x001700, dev_priv->ramin_base);
 981                 }
 982                 val = nv_rd32(dev, 0x700000 + (ptr & 0xffff));
 983                 spin_unlock_irqrestore(&dev_priv->vm_lock, flags);
 984                 return val;
 985         }
 986
 987         return nv_ri32(dev, gpuobj->pinst + offset);
 988 }
 989
 990 void
 991 nv_wo32(struct nouveau_gpuobj *gpuobj, u32 offset, u32 val)
 992 {
 993         struct drm_nouveau_private *dev_priv = gpuobj->dev->dev_private;
 994         struct drm_device *dev = gpuobj->dev;
 995         unsigned long flags;
 996
 997         if (gpuobj->pinst == ~0 || !dev_priv->ramin_available) {
 998                 u64  ptr = gpuobj->vinst + offset;
 999                 u32 base = ptr >> 16;
1000
1001                 spin_lock_irqsave(&dev_priv->vm_lock, flags);
1002                 if (dev_priv->ramin_base != base) {
1003                         dev_priv->ramin_base = base;
1004                         nv_wr32(dev, 0x001700, dev_priv->ramin_base);
1005                 }
1006                 nv_wr32(dev, 0x700000 + (ptr & 0xffff), val);
1007                 spin_unlock_irqrestore(&dev_priv->vm_lock, flags);
1008                 return;
1009         }
1010
1011         nv_wi32(dev, gpuobj->pinst + offset, val);
1012 }