1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright (c) 2018 The Linux Foundation. All rights reserved. */
3 
4 #include <linux/dma-mapping.h>
5 
6 #include "msm_drv.h"
7 #include "msm_mmu.h"
8 #include "adreno/adreno_gpu.h"
9 #include "adreno/a2xx.xml.h"
10 
11 struct msm_gpummu {
12 	struct msm_mmu base;
13 	struct msm_gpu *gpu;
14 	dma_addr_t pt_base;
15 	uint32_t *table;
16 };
17 #define to_msm_gpummu(x) container_of(x, struct msm_gpummu, base)
18 
19 #define GPUMMU_VA_START SZ_16M
20 #define GPUMMU_VA_RANGE (0xfff * SZ_64K)
21 #define GPUMMU_PAGE_SIZE SZ_4K
22 #define TABLE_SIZE (sizeof(uint32_t) * GPUMMU_VA_RANGE / GPUMMU_PAGE_SIZE)
23 
msm_gpummu_detach(struct msm_mmu * mmu)24 static void msm_gpummu_detach(struct msm_mmu *mmu)
25 {
26 }
27 
msm_gpummu_map(struct msm_mmu * mmu,uint64_t iova,struct sg_table * sgt,size_t len,int prot)28 static int msm_gpummu_map(struct msm_mmu *mmu, uint64_t iova,
29 		struct sg_table *sgt, size_t len, int prot)
30 {
31 	struct msm_gpummu *gpummu = to_msm_gpummu(mmu);
32 	unsigned idx = (iova - GPUMMU_VA_START) / GPUMMU_PAGE_SIZE;
33 	struct sg_dma_page_iter dma_iter;
34 	unsigned prot_bits = 0;
35 
36 	if (prot & IOMMU_WRITE)
37 		prot_bits |= 1;
38 	if (prot & IOMMU_READ)
39 		prot_bits |= 2;
40 
41 	for_each_sgtable_dma_page(sgt, &dma_iter, 0) {
42 		dma_addr_t addr = sg_page_iter_dma_address(&dma_iter);
43 		int i;
44 
45 		for (i = 0; i < PAGE_SIZE; i += GPUMMU_PAGE_SIZE)
46 			gpummu->table[idx++] = (addr + i) | prot_bits;
47 	}
48 
49 	/* we can improve by deferring flush for multiple map() */
50 	gpu_write(gpummu->gpu, REG_A2XX_MH_MMU_INVALIDATE,
51 		A2XX_MH_MMU_INVALIDATE_INVALIDATE_ALL |
52 		A2XX_MH_MMU_INVALIDATE_INVALIDATE_TC);
53 	return 0;
54 }
55 
msm_gpummu_unmap(struct msm_mmu * mmu,uint64_t iova,size_t len)56 static int msm_gpummu_unmap(struct msm_mmu *mmu, uint64_t iova, size_t len)
57 {
58 	struct msm_gpummu *gpummu = to_msm_gpummu(mmu);
59 	unsigned idx = (iova - GPUMMU_VA_START) / GPUMMU_PAGE_SIZE;
60 	unsigned i;
61 
62 	for (i = 0; i < len / GPUMMU_PAGE_SIZE; i++, idx++)
63                 gpummu->table[idx] = 0;
64 
65 	gpu_write(gpummu->gpu, REG_A2XX_MH_MMU_INVALIDATE,
66 		A2XX_MH_MMU_INVALIDATE_INVALIDATE_ALL |
67 		A2XX_MH_MMU_INVALIDATE_INVALIDATE_TC);
68 	return 0;
69 }
70 
msm_gpummu_resume_translation(struct msm_mmu * mmu)71 static void msm_gpummu_resume_translation(struct msm_mmu *mmu)
72 {
73 }
74 
msm_gpummu_destroy(struct msm_mmu * mmu)75 static void msm_gpummu_destroy(struct msm_mmu *mmu)
76 {
77 	struct msm_gpummu *gpummu = to_msm_gpummu(mmu);
78 
79 	dma_free_attrs(mmu->dev, TABLE_SIZE, gpummu->table, gpummu->pt_base,
80 		DMA_ATTR_FORCE_CONTIGUOUS);
81 
82 	kfree(gpummu);
83 }
84 
85 static const struct msm_mmu_funcs funcs = {
86 		.detach = msm_gpummu_detach,
87 		.map = msm_gpummu_map,
88 		.unmap = msm_gpummu_unmap,
89 		.destroy = msm_gpummu_destroy,
90 		.resume_translation = msm_gpummu_resume_translation,
91 };
92 
msm_gpummu_new(struct device * dev,struct msm_gpu * gpu)93 struct msm_mmu *msm_gpummu_new(struct device *dev, struct msm_gpu *gpu)
94 {
95 	struct msm_gpummu *gpummu;
96 
97 	gpummu = kzalloc(sizeof(*gpummu), GFP_KERNEL);
98 	if (!gpummu)
99 		return ERR_PTR(-ENOMEM);
100 
101 	gpummu->table = dma_alloc_attrs(dev, TABLE_SIZE + 32, &gpummu->pt_base,
102 		GFP_KERNEL | __GFP_ZERO, DMA_ATTR_FORCE_CONTIGUOUS);
103 	if (!gpummu->table) {
104 		kfree(gpummu);
105 		return ERR_PTR(-ENOMEM);
106 	}
107 
108 	gpummu->gpu = gpu;
109 	msm_mmu_init(&gpummu->base, dev, &funcs, MSM_MMU_GPUMMU);
110 
111 	return &gpummu->base;
112 }
113 
msm_gpummu_params(struct msm_mmu * mmu,dma_addr_t * pt_base,dma_addr_t * tran_error)114 void msm_gpummu_params(struct msm_mmu *mmu, dma_addr_t *pt_base,
115 		dma_addr_t *tran_error)
116 {
117 	dma_addr_t base = to_msm_gpummu(mmu)->pt_base;
118 
119 	*pt_base = base;
120 	*tran_error = base + TABLE_SIZE; /* 32-byte aligned */
121 }
122