Commit ad926015 authored by Mikko Perttunen's avatar Mikko Perttunen Committed by Thierry Reding

drm/tegra: Add Tegra DRM allocation API

Add a new IO virtual memory allocation API to allow clients to
allocate non-GEM memory in the Tegra DRM IOMMU domain. This is
required e.g. for loading client firmware when clients are attached
to the IOMMU domain.

The allocator allocates contiguous physical pages that are then
mapped contiguously to the IOMMU domain using the iova_domain
library provided by the kernel. Contiguous physical pages are
used so that the same allocator works also when IOMMU support
is disabled and therefore devices access physical memory directly.
Signed-off-by: default avatarMikko Perttunen <mperttunen@nvidia.com>
Signed-off-by: default avatarThierry Reding <treding@nvidia.com>
parent 5e91144d
/* /*
* Copyright (C) 2012 Avionic Design GmbH * Copyright (C) 2012 Avionic Design GmbH
* Copyright (C) 2012-2013 NVIDIA CORPORATION. All rights reserved. * Copyright (C) 2012-2016 NVIDIA CORPORATION. All rights reserved.
* *
* This program is free software; you can redistribute it and/or modify * This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License version 2 as * it under the terms of the GNU General Public License version 2 as
* published by the Free Software Foundation. * published by the Free Software Foundation.
*/ */
#include <linux/bitops.h>
#include <linux/host1x.h> #include <linux/host1x.h>
#include <linux/idr.h> #include <linux/idr.h>
#include <linux/iommu.h> #include <linux/iommu.h>
...@@ -24,6 +25,8 @@ ...@@ -24,6 +25,8 @@
#define DRIVER_MINOR 0 #define DRIVER_MINOR 0
#define DRIVER_PATCHLEVEL 0 #define DRIVER_PATCHLEVEL 0
#define CARVEOUT_SZ SZ_64M
struct tegra_drm_file { struct tegra_drm_file {
struct idr contexts; struct idr contexts;
struct mutex lock; struct mutex lock;
...@@ -128,8 +131,9 @@ static int tegra_drm_load(struct drm_device *drm, unsigned long flags) ...@@ -128,8 +131,9 @@ static int tegra_drm_load(struct drm_device *drm, unsigned long flags)
return -ENOMEM; return -ENOMEM;
if (iommu_present(&platform_bus_type)) { if (iommu_present(&platform_bus_type)) {
u64 carveout_start, carveout_end, gem_start, gem_end;
struct iommu_domain_geometry *geometry; struct iommu_domain_geometry *geometry;
u64 start, end; unsigned long order;
tegra->domain = iommu_domain_alloc(&platform_bus_type); tegra->domain = iommu_domain_alloc(&platform_bus_type);
if (!tegra->domain) { if (!tegra->domain) {
...@@ -138,13 +142,26 @@ static int tegra_drm_load(struct drm_device *drm, unsigned long flags) ...@@ -138,13 +142,26 @@ static int tegra_drm_load(struct drm_device *drm, unsigned long flags)
} }
geometry = &tegra->domain->geometry; geometry = &tegra->domain->geometry;
start = geometry->aperture_start; gem_start = geometry->aperture_start;
end = geometry->aperture_end; gem_end = geometry->aperture_end - CARVEOUT_SZ;
carveout_start = gem_end + 1;
carveout_end = geometry->aperture_end;
order = __ffs(tegra->domain->pgsize_bitmap);
init_iova_domain(&tegra->carveout.domain, 1UL << order,
carveout_start >> order,
carveout_end >> order);
tegra->carveout.shift = iova_shift(&tegra->carveout.domain);
tegra->carveout.limit = carveout_end >> tegra->carveout.shift;
DRM_DEBUG_DRIVER("IOMMU aperture initialized (%#llx-%#llx)\n", drm_mm_init(&tegra->mm, gem_start, gem_end - gem_start + 1);
start, end);
drm_mm_init(&tegra->mm, start, end - start + 1);
mutex_init(&tegra->mm_lock); mutex_init(&tegra->mm_lock);
DRM_DEBUG("IOMMU apertures:\n");
DRM_DEBUG(" GEM: %#llx-%#llx\n", gem_start, gem_end);
DRM_DEBUG(" Carveout: %#llx-%#llx\n", carveout_start,
carveout_end);
} }
mutex_init(&tegra->clients_lock); mutex_init(&tegra->clients_lock);
...@@ -214,6 +231,7 @@ static int tegra_drm_load(struct drm_device *drm, unsigned long flags) ...@@ -214,6 +231,7 @@ static int tegra_drm_load(struct drm_device *drm, unsigned long flags)
iommu_domain_free(tegra->domain); iommu_domain_free(tegra->domain);
drm_mm_takedown(&tegra->mm); drm_mm_takedown(&tegra->mm);
mutex_destroy(&tegra->mm_lock); mutex_destroy(&tegra->mm_lock);
put_iova_domain(&tegra->carveout.domain);
} }
free: free:
kfree(tegra); kfree(tegra);
...@@ -239,6 +257,7 @@ static void tegra_drm_unload(struct drm_device *drm) ...@@ -239,6 +257,7 @@ static void tegra_drm_unload(struct drm_device *drm)
iommu_domain_free(tegra->domain); iommu_domain_free(tegra->domain);
drm_mm_takedown(&tegra->mm); drm_mm_takedown(&tegra->mm);
mutex_destroy(&tegra->mm_lock); mutex_destroy(&tegra->mm_lock);
put_iova_domain(&tegra->carveout.domain);
} }
kfree(tegra); kfree(tegra);
...@@ -1030,6 +1049,84 @@ int tegra_drm_unregister_client(struct tegra_drm *tegra, ...@@ -1030,6 +1049,84 @@ int tegra_drm_unregister_client(struct tegra_drm *tegra,
return 0; return 0;
} }
void *tegra_drm_alloc(struct tegra_drm *tegra, size_t size,
dma_addr_t *dma)
{
struct iova *alloc;
void *virt;
gfp_t gfp;
int err;
if (tegra->domain)
size = iova_align(&tegra->carveout.domain, size);
else
size = PAGE_ALIGN(size);
gfp = GFP_KERNEL | __GFP_ZERO;
if (!tegra->domain) {
/*
* Many units only support 32-bit addresses, even on 64-bit
* SoCs. If there is no IOMMU to translate into a 32-bit IO
* virtual address space, force allocations to be in the
* lower 32-bit range.
*/
gfp |= GFP_DMA;
}
virt = (void *)__get_free_pages(gfp, get_order(size));
if (!virt)
return ERR_PTR(-ENOMEM);
if (!tegra->domain) {
/*
* If IOMMU is disabled, devices address physical memory
* directly.
*/
*dma = virt_to_phys(virt);
return virt;
}
alloc = alloc_iova(&tegra->carveout.domain,
size >> tegra->carveout.shift,
tegra->carveout.limit, true);
if (!alloc) {
err = -EBUSY;
goto free_pages;
}
*dma = iova_dma_addr(&tegra->carveout.domain, alloc);
err = iommu_map(tegra->domain, *dma, virt_to_phys(virt),
size, IOMMU_READ | IOMMU_WRITE);
if (err < 0)
goto free_iova;
return virt;
free_iova:
__free_iova(&tegra->carveout.domain, alloc);
free_pages:
free_pages((unsigned long)virt, get_order(size));
return ERR_PTR(err);
}
void tegra_drm_free(struct tegra_drm *tegra, size_t size, void *virt,
dma_addr_t dma)
{
if (tegra->domain)
size = iova_align(&tegra->carveout.domain, size);
else
size = PAGE_ALIGN(size);
if (tegra->domain) {
iommu_unmap(tegra->domain, dma, size);
free_iova(&tegra->carveout.domain,
iova_pfn(&tegra->carveout.domain, dma));
}
free_pages((unsigned long)virt, get_order(size));
}
static int host1x_drm_probe(struct host1x_device *dev) static int host1x_drm_probe(struct host1x_device *dev)
{ {
struct drm_driver *driver = &tegra_drm_driver; struct drm_driver *driver = &tegra_drm_driver;
......
...@@ -12,6 +12,7 @@ ...@@ -12,6 +12,7 @@
#include <uapi/drm/tegra_drm.h> #include <uapi/drm/tegra_drm.h>
#include <linux/host1x.h> #include <linux/host1x.h>
#include <linux/iova.h>
#include <linux/of_gpio.h> #include <linux/of_gpio.h>
#include <drm/drmP.h> #include <drm/drmP.h>
...@@ -45,6 +46,12 @@ struct tegra_drm { ...@@ -45,6 +46,12 @@ struct tegra_drm {
struct mutex mm_lock; struct mutex mm_lock;
struct drm_mm mm; struct drm_mm mm;
struct {
struct iova_domain domain;
unsigned long shift;
unsigned long limit;
} carveout;
struct mutex clients_lock; struct mutex clients_lock;
struct list_head clients; struct list_head clients;
...@@ -106,6 +113,10 @@ int tegra_drm_unregister_client(struct tegra_drm *tegra, ...@@ -106,6 +113,10 @@ int tegra_drm_unregister_client(struct tegra_drm *tegra,
int tegra_drm_init(struct tegra_drm *tegra, struct drm_device *drm); int tegra_drm_init(struct tegra_drm *tegra, struct drm_device *drm);
int tegra_drm_exit(struct tegra_drm *tegra); int tegra_drm_exit(struct tegra_drm *tegra);
void *tegra_drm_alloc(struct tegra_drm *tegra, size_t size, dma_addr_t *iova);
void tegra_drm_free(struct tegra_drm *tegra, size_t size, void *virt,
dma_addr_t iova);
struct tegra_dc_soc_info; struct tegra_dc_soc_info;
struct tegra_output; struct tegra_output;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment