gpu: nvgpu: Use common allocator for patch
author     Terje Bergstrom <tbergstrom@nvidia.com>
           Sat, 21 Mar 2015 15:10:59 +0000 (08:10 -0700)
committer  Terje Bergstrom <tbergstrom@nvidia.com>
           Wed, 8 Apr 2015 22:37:18 +0000 (15:37 -0700)
Reduce the amount of duplicate code around memory allocation by using
common helpers and a common data structure for storing the results of
allocations.

Bug 1605769

Change-Id: Idf51831e8be9cabe1ab9122b18317137fde6339f
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: http://git-master/r/721030
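
For reference, the common pattern this change moves to looks roughly like the
sketch below. The struct mem_desc layout is an assumption inferred from the
fields this diff touches (cpu_va, pages, sgt, size, gpu_va); the authoritative
definition lives in mm_gk20a.h, and the field types are guesses based on how
each field is used in the hunks that follow.

    /* Assumed shape of the shared allocation descriptor. */
    struct mem_desc {
            void *cpu_va;           /* kernel mapping, NULL while unmapped */
            struct page **pages;    /* backing pages handed to vmap() */
            struct sg_table *sgt;   /* scatter list; non-NULL once allocated */
            size_t size;            /* allocation size in bytes */
            u64 gpu_va;             /* GMMU virtual address in the channel VM */
    };

    /* Allocation, mapping and teardown of the patch buffer with the
     * common helpers, as used in gr_gk20a.c after this change. */
    err = gk20a_gmmu_alloc_map_attr(ch_vm, DMA_ATTR_NO_KERNEL_MAPPING,
                                    128 * sizeof(u32), &patch_ctx->mem);
    if (err)
            return err;
    ...
    gk20a_gmmu_unmap(c->vm, patch_ctx->mem.gpu_va,
                     patch_ctx->mem.size, gk20a_mem_flag_none);
    gk20a_gmmu_free_attr(g, DMA_ATTR_NO_KERNEL_MAPPING, &patch_ctx->mem);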

drivers/gpu/nvgpu/gk20a/gr_gk20a.c
drivers/gpu/nvgpu/gk20a/mm_gk20a.c
drivers/gpu/nvgpu/gk20a/mm_gk20a.h
drivers/gpu/nvgpu/vgpu/gr_vgpu.c

diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index d32db731b172675ebc349e23556d3cd7e9d0a5df..018d44293b706250c8f66b90c825fd3da07f7f3f 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -597,16 +597,16 @@ int gr_gk20a_ctx_patch_write_begin(struct gk20a *g,
                                          struct channel_ctx_gk20a *ch_ctx)
 {
        /* being defensive still... */
-       if (WARN_ON(ch_ctx->patch_ctx.cpu_va)) {
+       if (WARN_ON(ch_ctx->patch_ctx.mem.cpu_va)) {
                gk20a_err(dev_from_gk20a(g), "nested ctx patch begin?");
                return -EBUSY;
        }
 
-       ch_ctx->patch_ctx.cpu_va = vmap(ch_ctx->patch_ctx.pages,
-                       PAGE_ALIGN(ch_ctx->patch_ctx.size) >> PAGE_SHIFT,
+       ch_ctx->patch_ctx.mem.cpu_va = vmap(ch_ctx->patch_ctx.mem.pages,
+                       PAGE_ALIGN(ch_ctx->patch_ctx.mem.size) >> PAGE_SHIFT,
                        0, pgprot_dmacoherent(PAGE_KERNEL));
 
-       if (!ch_ctx->patch_ctx.cpu_va)
+       if (!ch_ctx->patch_ctx.mem.cpu_va)
                return -ENOMEM;
 
        return 0;
@@ -616,13 +616,13 @@ int gr_gk20a_ctx_patch_write_end(struct gk20a *g,
                                        struct channel_ctx_gk20a *ch_ctx)
 {
        /* being defensive still... */
-       if (!ch_ctx->patch_ctx.cpu_va) {
+       if (!ch_ctx->patch_ctx.mem.cpu_va) {
                gk20a_err(dev_from_gk20a(g), "dangling ctx patch end?");
                return -EINVAL;
        }
 
-       vunmap(ch_ctx->patch_ctx.cpu_va);
-       ch_ctx->patch_ctx.cpu_va = NULL;
+       vunmap(ch_ctx->patch_ctx.mem.cpu_va);
+       ch_ctx->patch_ctx.mem.cpu_va = NULL;
        return 0;
 }
 
@@ -642,7 +642,7 @@ int gr_gk20a_ctx_patch_write(struct gk20a *g,
                /* we added an optimization prolog, epilog
                 * to get rid of unnecessary maps and l2 invals.
                 * but be defensive still... */
-               if (!ch_ctx->patch_ctx.cpu_va) {
+               if (!ch_ctx->patch_ctx.mem.cpu_va) {
                        int err;
                        gk20a_err(dev_from_gk20a(g),
                                   "per-write ctx patch begin?");
@@ -654,7 +654,7 @@ int gr_gk20a_ctx_patch_write(struct gk20a *g,
                } else
                        mapped_here = false;
 
-               patch_ptr = ch_ctx->patch_ctx.cpu_va;
+               patch_ptr = ch_ctx->patch_ctx.mem.cpu_va;
                patch_slot = ch_ctx->patch_ctx.data_count * 2;
 
                gk20a_mem_wr32(patch_ptr, patch_slot++, addr);
@@ -1622,8 +1622,8 @@ int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
        gk20a_mem_wr32(ctx_ptr + ctxsw_prog_main_image_num_save_ops_o(), 0, 0);
        gk20a_mem_wr32(ctx_ptr + ctxsw_prog_main_image_num_restore_ops_o(), 0, 0);
 
-       virt_addr_lo = u64_lo32(ch_ctx->patch_ctx.gpu_va);
-       virt_addr_hi = u64_hi32(ch_ctx->patch_ctx.gpu_va);
+       virt_addr_lo = u64_lo32(ch_ctx->patch_ctx.mem.gpu_va);
+       virt_addr_hi = u64_hi32(ch_ctx->patch_ctx.mem.gpu_va);
 
        gk20a_mem_wr32(ctx_ptr + ctxsw_prog_main_image_patch_count_o(), 0,
                 ch_ctx->patch_ctx.data_count);
@@ -2568,82 +2568,33 @@ static int gr_gk20a_alloc_channel_patch_ctx(struct gk20a *g,
                                struct channel_gk20a *c)
 {
        struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
-       struct device *d = dev_from_gk20a(g);
        struct vm_gk20a *ch_vm = c->vm;
-       DEFINE_DMA_ATTRS(attrs);
-       struct sg_table *sgt;
        int err = 0;
-       dma_addr_t iova;
 
        gk20a_dbg_fn("");
 
-       patch_ctx->size = 128 * sizeof(u32);
-       dma_set_attr(DMA_ATTR_NO_KERNEL_MAPPING, &attrs);
-       patch_ctx->pages = dma_alloc_attrs(d, patch_ctx->size,
-                               &iova, GFP_KERNEL,
-                               &attrs);
-       if (!patch_ctx->pages)
-               return -ENOMEM;
-
-       patch_ctx->iova = iova;
-       err = gk20a_get_sgtable_from_pages(d, &sgt, patch_ctx->pages,
-                       patch_ctx->iova, patch_ctx->size);
+       err = gk20a_gmmu_alloc_map_attr(ch_vm, DMA_ATTR_NO_KERNEL_MAPPING,
+                                       128 * sizeof(u32), &patch_ctx->mem);
        if (err)
-               goto err_free;
-
-       patch_ctx->gpu_va = gk20a_gmmu_map(ch_vm, &sgt, patch_ctx->size,
-                                       0, gk20a_mem_flag_none);
-       if (!patch_ctx->gpu_va)
-               goto err_free_sgtable;
-
-       gk20a_free_sgtable(&sgt);
+               return err;
 
        gk20a_dbg_fn("done");
        return 0;
-
- err_free_sgtable:
-       gk20a_free_sgtable(&sgt);
- err_free:
-       dma_free_attrs(d, patch_ctx->size,
-               patch_ctx->pages, patch_ctx->iova, &attrs);
-       patch_ctx->pages = NULL;
-       patch_ctx->iova = 0;
-       gk20a_err(dev_from_gk20a(g), "fail");
-       return err;
-}
-
-static void gr_gk20a_unmap_channel_patch_ctx(struct channel_gk20a *c)
-{
-       struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
-       struct vm_gk20a *ch_vm = c->vm;
-
-       gk20a_dbg_fn("");
-
-       if (patch_ctx->gpu_va)
-               gk20a_gmmu_unmap(ch_vm, patch_ctx->gpu_va,
-                       patch_ctx->size, gk20a_mem_flag_none);
-       patch_ctx->gpu_va = 0;
-       patch_ctx->data_count = 0;
 }
 
 static void gr_gk20a_free_channel_patch_ctx(struct channel_gk20a *c)
 {
        struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
        struct gk20a *g = c->g;
-       struct device *d = dev_from_gk20a(g);
-       DEFINE_DMA_ATTRS(attrs);
 
        gk20a_dbg_fn("");
 
-       gr_gk20a_unmap_channel_patch_ctx(c);
+       if (patch_ctx->mem.gpu_va)
+               gk20a_gmmu_unmap(c->vm, patch_ctx->mem.gpu_va,
+                                patch_ctx->mem.size, gk20a_mem_flag_none);
 
-       if (patch_ctx->pages) {
-               dma_set_attr(DMA_ATTR_NO_KERNEL_MAPPING, &attrs);
-               dma_free_attrs(d, patch_ctx->size,
-                       patch_ctx->pages, patch_ctx->iova, &attrs);
-               patch_ctx->pages = NULL;
-               patch_ctx->iova = 0;
-       }
+       gk20a_gmmu_free_attr(g, DMA_ATTR_NO_KERNEL_MAPPING, &patch_ctx->mem);
+       patch_ctx->data_count = 0;
 }
 
 void gk20a_free_channel_ctx(struct channel_gk20a *c)
@@ -2757,7 +2708,7 @@ int gk20a_alloc_obj_ctx(struct channel_gk20a  *c,
        }
 
        /* allocate patch buffer */
-       if (ch_ctx->patch_ctx.pages == NULL) {
+       if (ch_ctx->patch_ctx.mem.sgt == NULL) {
                err = gr_gk20a_alloc_channel_patch_ctx(g, c);
                if (err) {
                        gk20a_err(dev_from_gk20a(g),
@@ -2883,7 +2834,7 @@ int gk20a_free_obj_ctx(struct channel_gk20a  *c,
                gk20a_disable_channel(c,
                        !c->has_timedout,
                        timeout);
-               gr_gk20a_unmap_channel_patch_ctx(c);
+               gr_gk20a_free_channel_patch_ctx(c);
        }
 
        return 0;
@@ -6081,8 +6032,8 @@ static int gr_gk20a_ctx_patch_smpc(struct gk20a *g,
                                gr_gk20a_ctx_patch_write(g, ch_ctx,
                                                         addr, data, true);
 
-                               vaddr_lo = u64_lo32(ch_ctx->patch_ctx.gpu_va);
-                               vaddr_hi = u64_hi32(ch_ctx->patch_ctx.gpu_va);
+                               vaddr_lo = u64_lo32(ch_ctx->patch_ctx.mem.gpu_va);
+                               vaddr_hi = u64_hi32(ch_ctx->patch_ctx.mem.gpu_va);
 
                                gk20a_mem_wr32(context +
                                         ctxsw_prog_main_image_patch_count_o(),
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
index c816836e3c8c51dd6c4d4ba43129020233e455c4..bfd6ff8629703a540e9ecc68acec976f4d7ed1cd 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -1616,6 +1616,7 @@ void gk20a_gmmu_free_attr(struct gk20a *g, enum dma_attr attr,
                }
 
                mem->cpu_va = NULL;
+               mem->pages = NULL;
        }
 
        if (mem->sgt)
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
index 9165953710f3071d61e8d62341b3f5262ad180f3..df9ebec32c80ea5df900535f9cec9b8070d316a0 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -68,11 +68,7 @@ struct gpfifo_desc {
 };
 
 struct patch_desc {
-       struct page **pages;
-       u64 iova;
-       size_t size;
-       void *cpu_va;
-       u64 gpu_va;
+       struct mem_desc mem;
        u32 data_count;
 };
 
diff --git a/drivers/gpu/nvgpu/vgpu/gr_vgpu.c b/drivers/gpu/nvgpu/vgpu/gr_vgpu.c
index fd8bb81bf9ce4d743cc930f85951cf257f0bef67..8d0bb6cf1daa5fd214cd5cb486b4a44b71ea0a40 100644
--- a/drivers/gpu/nvgpu/vgpu/gr_vgpu.c
+++ b/drivers/gpu/nvgpu/vgpu/gr_vgpu.c
@@ -321,18 +321,20 @@ static int vgpu_gr_alloc_channel_patch_ctx(struct gk20a *g,
 
        gk20a_dbg_fn("");
 
-       patch_ctx->size = 128 * sizeof(u32);
-       patch_ctx->gpu_va = gk20a_vm_alloc_va(ch_vm, patch_ctx->size, 0);
-       if (!patch_ctx->gpu_va)
+       patch_ctx->mem.size = 128 * sizeof(u32);
+       patch_ctx->mem.gpu_va = gk20a_vm_alloc_va(ch_vm,
+                                                 patch_ctx->mem.size, 0);
+       if (!patch_ctx->mem.gpu_va)
                return -ENOMEM;
 
        msg.cmd = TEGRA_VGPU_CMD_CHANNEL_ALLOC_GR_PATCH_CTX;
        msg.handle = platform->virt_handle;
        p->handle = c->virt_ctx;
-       p->patch_ctx_va = patch_ctx->gpu_va;
+       p->patch_ctx_va = patch_ctx->mem.gpu_va;
        err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
        if (err || msg.ret) {
-               gk20a_vm_free_va(ch_vm, patch_ctx->gpu_va, patch_ctx->size, 0);
+               gk20a_vm_free_va(ch_vm, patch_ctx->mem.gpu_va,
+                                patch_ctx->mem.size, 0);
                err = -ENOMEM;
        }
 
@@ -347,7 +349,7 @@ static void vgpu_gr_free_channel_patch_ctx(struct channel_gk20a *c)
 
        gk20a_dbg_fn("");
 
-       if (patch_ctx->gpu_va) {
+       if (patch_ctx->mem.gpu_va) {
                struct tegra_vgpu_cmd_msg msg;
                struct tegra_vgpu_gr_ctx_params *p = &msg.params.gr_ctx;
                int err;
@@ -358,8 +360,9 @@ static void vgpu_gr_free_channel_patch_ctx(struct channel_gk20a *c)
                err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
                WARN_ON(err || msg.ret);
 
-               gk20a_vm_free_va(ch_vm, patch_ctx->gpu_va, patch_ctx->size, 0);
-               patch_ctx->gpu_va = 0;
+               gk20a_vm_free_va(ch_vm, patch_ctx->mem.gpu_va,
+                                patch_ctx->mem.size, 0);
+               patch_ctx->mem.gpu_va = 0;
        }
 }
 
@@ -438,7 +441,7 @@ static int vgpu_gr_alloc_obj_ctx(struct channel_gk20a  *c,
        }
 
        /* allocate patch buffer */
-       if (ch_ctx->patch_ctx.pages == NULL) {
+       if (ch_ctx->patch_ctx.mem.pages == NULL) {
                err = vgpu_gr_alloc_channel_patch_ctx(g, c);
                if (err) {
                        gk20a_err(dev_from_gk20a(g),