2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
24 * Authors: Dave Airlie
29 #include <linux/pci.h>
30 #include <linux/vmalloc.h>
32 #include <drm/amdgpu_drm.h>
34 #include <asm/set_memory.h>
40 * The GART (Graphics Aperture Remapping Table) is an aperture
41 * in the GPU's address space. System pages can be mapped into
42 * the aperture and look like contiguous pages from the GPU's
43 * perspective. A page table maps the pages in the aperture
44 * to the actual backing pages in system memory.
46 * Radeon GPUs support both an internal GART, as described above,
47 * and AGP. AGP works similarly, but the GART table is configured
48 * and maintained by the northbridge rather than the driver.
49 * Radeon hw has a separate AGP aperture that is programmed to
50 * point to the AGP aperture provided by the northbridge and the
51 * requests are passed through to the northbridge aperture.
52 * Both AGP and internal GART can be used at the same time, however
53 * that is not currently supported by the driver.
55 * This file handles the common internal GART management.
59 * Common GART table functions.
63 * amdgpu_dummy_page_init - init dummy page used by the driver
65 * @adev: amdgpu_device pointer
67 * Allocate the dummy page used by the driver (all asics).
68 * This dummy page is used by the driver as a filler for gart entries
69 * when pages are taken out of the GART
70 * Returns 0 on sucess, -ENOMEM on failure.
72 static int amdgpu_gart_dummy_page_init(struct amdgpu_device
*adev
)
74 struct page
*dummy_page
= ttm_bo_glob
.dummy_read_page
;
76 if (adev
->dummy_page_addr
)
78 adev
->dummy_page_addr
= pci_map_page(adev
->pdev
, dummy_page
, 0,
79 PAGE_SIZE
, PCI_DMA_BIDIRECTIONAL
);
80 if (pci_dma_mapping_error(adev
->pdev
, adev
->dummy_page_addr
)) {
81 dev_err(&adev
->pdev
->dev
, "Failed to DMA MAP the dummy page\n");
82 adev
->dummy_page_addr
= 0;
89 * amdgpu_dummy_page_fini - free dummy page used by the driver
91 * @adev: amdgpu_device pointer
93 * Frees the dummy page used by the driver (all asics).
95 static void amdgpu_gart_dummy_page_fini(struct amdgpu_device
*adev
)
97 if (!adev
->dummy_page_addr
)
99 pci_unmap_page(adev
->pdev
, adev
->dummy_page_addr
,
100 PAGE_SIZE
, PCI_DMA_BIDIRECTIONAL
);
101 adev
->dummy_page_addr
= 0;
105 * amdgpu_gart_table_vram_alloc - allocate vram for gart page table
107 * @adev: amdgpu_device pointer
109 * Allocate video memory for GART page table
110 * (pcie r4xx, r5xx+). These asics require the
111 * gart table to be in video memory.
112 * Returns 0 for success, error for failure.
114 int amdgpu_gart_table_vram_alloc(struct amdgpu_device
*adev
)
118 if (adev
->gart
.bo
== NULL
) {
119 struct amdgpu_bo_param bp
;
121 memset(&bp
, 0, sizeof(bp
));
122 bp
.size
= adev
->gart
.table_size
;
123 bp
.byte_align
= PAGE_SIZE
;
124 bp
.domain
= AMDGPU_GEM_DOMAIN_VRAM
;
125 bp
.flags
= AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED
|
126 AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS
;
127 bp
.type
= ttm_bo_type_kernel
;
129 r
= amdgpu_bo_create(adev
, &bp
, &adev
->gart
.bo
);
138 * amdgpu_gart_table_vram_pin - pin gart page table in vram
140 * @adev: amdgpu_device pointer
142 * Pin the GART page table in vram so it will not be moved
143 * by the memory manager (pcie r4xx, r5xx+). These asics require the
144 * gart table to be in video memory.
145 * Returns 0 for success, error for failure.
147 int amdgpu_gart_table_vram_pin(struct amdgpu_device
*adev
)
151 r
= amdgpu_bo_reserve(adev
->gart
.bo
, false);
152 if (unlikely(r
!= 0))
154 r
= amdgpu_bo_pin(adev
->gart
.bo
, AMDGPU_GEM_DOMAIN_VRAM
);
156 amdgpu_bo_unreserve(adev
->gart
.bo
);
159 r
= amdgpu_bo_kmap(adev
->gart
.bo
, &adev
->gart
.ptr
);
161 amdgpu_bo_unpin(adev
->gart
.bo
);
162 amdgpu_bo_unreserve(adev
->gart
.bo
);
167 * amdgpu_gart_table_vram_unpin - unpin gart page table in vram
169 * @adev: amdgpu_device pointer
171 * Unpin the GART page table in vram (pcie r4xx, r5xx+).
172 * These asics require the gart table to be in video memory.
174 void amdgpu_gart_table_vram_unpin(struct amdgpu_device
*adev
)
178 if (adev
->gart
.bo
== NULL
) {
181 r
= amdgpu_bo_reserve(adev
->gart
.bo
, true);
182 if (likely(r
== 0)) {
183 amdgpu_bo_kunmap(adev
->gart
.bo
);
184 amdgpu_bo_unpin(adev
->gart
.bo
);
185 amdgpu_bo_unreserve(adev
->gart
.bo
);
186 adev
->gart
.ptr
= NULL
;
191 * amdgpu_gart_table_vram_free - free gart page table vram
193 * @adev: amdgpu_device pointer
195 * Free the video memory used for the GART page table
196 * (pcie r4xx, r5xx+). These asics require the gart table to
197 * be in video memory.
199 void amdgpu_gart_table_vram_free(struct amdgpu_device
*adev
)
201 if (adev
->gart
.bo
== NULL
) {
204 amdgpu_bo_unref(&adev
->gart
.bo
);
208 * Common gart functions.
211 * amdgpu_gart_unbind - unbind pages from the gart page table
213 * @adev: amdgpu_device pointer
214 * @offset: offset into the GPU's gart aperture
215 * @pages: number of pages to unbind
217 * Unbinds the requested pages from the gart page table and
218 * replaces them with the dummy page (all asics).
219 * Returns 0 for success, -EINVAL for failure.
221 int amdgpu_gart_unbind(struct amdgpu_device
*adev
, uint64_t offset
,
228 /* Starting from VEGA10, system bit must be 0 to mean invalid. */
231 if (!adev
->gart
.ready
) {
232 WARN(1, "trying to unbind memory from uninitialized GART !\n");
236 t
= offset
/ AMDGPU_GPU_PAGE_SIZE
;
237 p
= t
/ AMDGPU_GPU_PAGES_IN_CPU_PAGE
;
238 for (i
= 0; i
< pages
; i
++, p
++) {
239 #ifdef CONFIG_DRM_AMDGPU_GART_DEBUGFS
240 adev
->gart
.pages
[p
] = NULL
;
242 page_base
= adev
->dummy_page_addr
;
246 for (j
= 0; j
< AMDGPU_GPU_PAGES_IN_CPU_PAGE
; j
++, t
++) {
247 amdgpu_gmc_set_pte_pde(adev
, adev
->gart
.ptr
,
248 t
, page_base
, flags
);
249 page_base
+= AMDGPU_GPU_PAGE_SIZE
;
253 amdgpu_asic_flush_hdp(adev
, NULL
);
254 for (i
= 0; i
< adev
->num_vmhubs
; i
++)
255 amdgpu_gmc_flush_gpu_tlb(adev
, 0, i
, 0);
261 * amdgpu_gart_map - map dma_addresses into GART entries
263 * @adev: amdgpu_device pointer
264 * @offset: offset into the GPU's gart aperture
265 * @pages: number of pages to bind
266 * @dma_addr: DMA addresses of pages
267 * @flags: page table entry flags
268 * @dst: CPU address of the gart table
270 * Map the dma_addresses into GART entries (all asics).
271 * Returns 0 for success, -EINVAL for failure.
273 int amdgpu_gart_map(struct amdgpu_device
*adev
, uint64_t offset
,
274 int pages
, dma_addr_t
*dma_addr
, uint64_t flags
,
280 if (!adev
->gart
.ready
) {
281 WARN(1, "trying to bind memory to uninitialized GART !\n");
285 t
= offset
/ AMDGPU_GPU_PAGE_SIZE
;
287 for (i
= 0; i
< pages
; i
++) {
288 page_base
= dma_addr
[i
];
289 for (j
= 0; j
< AMDGPU_GPU_PAGES_IN_CPU_PAGE
; j
++, t
++) {
290 amdgpu_gmc_set_pte_pde(adev
, dst
, t
, page_base
, flags
);
291 page_base
+= AMDGPU_GPU_PAGE_SIZE
;
298 * amdgpu_gart_bind - bind pages into the gart page table
300 * @adev: amdgpu_device pointer
301 * @offset: offset into the GPU's gart aperture
302 * @pages: number of pages to bind
303 * @pagelist: pages to bind
304 * @dma_addr: DMA addresses of pages
305 * @flags: page table entry flags
307 * Binds the requested pages to the gart page table
309 * Returns 0 for success, -EINVAL for failure.
311 int amdgpu_gart_bind(struct amdgpu_device
*adev
, uint64_t offset
,
312 int pages
, struct page
**pagelist
, dma_addr_t
*dma_addr
,
315 #ifdef CONFIG_DRM_AMDGPU_GART_DEBUGFS
320 if (!adev
->gart
.ready
) {
321 WARN(1, "trying to bind memory to uninitialized GART !\n");
325 #ifdef CONFIG_DRM_AMDGPU_GART_DEBUGFS
326 t
= offset
/ AMDGPU_GPU_PAGE_SIZE
;
327 p
= t
/ AMDGPU_GPU_PAGES_IN_CPU_PAGE
;
328 for (i
= 0; i
< pages
; i
++, p
++)
329 adev
->gart
.pages
[p
] = pagelist
? pagelist
[i
] : NULL
;
335 r
= amdgpu_gart_map(adev
, offset
, pages
, dma_addr
, flags
,
341 amdgpu_asic_flush_hdp(adev
, NULL
);
342 for (i
= 0; i
< adev
->num_vmhubs
; i
++)
343 amdgpu_gmc_flush_gpu_tlb(adev
, 0, i
, 0);
348 * amdgpu_gart_init - init the driver info for managing the gart
350 * @adev: amdgpu_device pointer
352 * Allocate the dummy page and init the gart driver info (all asics).
353 * Returns 0 for success, error for failure.
355 int amdgpu_gart_init(struct amdgpu_device
*adev
)
359 if (adev
->dummy_page_addr
)
362 /* We need PAGE_SIZE >= AMDGPU_GPU_PAGE_SIZE */
363 if (PAGE_SIZE
< AMDGPU_GPU_PAGE_SIZE
) {
364 DRM_ERROR("Page size is smaller than GPU page size!\n");
367 r
= amdgpu_gart_dummy_page_init(adev
);
370 /* Compute table size */
371 adev
->gart
.num_cpu_pages
= adev
->gmc
.gart_size
/ PAGE_SIZE
;
372 adev
->gart
.num_gpu_pages
= adev
->gmc
.gart_size
/ AMDGPU_GPU_PAGE_SIZE
;
373 DRM_INFO("GART: num cpu pages %u, num gpu pages %u\n",
374 adev
->gart
.num_cpu_pages
, adev
->gart
.num_gpu_pages
);
376 #ifdef CONFIG_DRM_AMDGPU_GART_DEBUGFS
377 /* Allocate pages table */
378 adev
->gart
.pages
= vzalloc(array_size(sizeof(void *),
379 adev
->gart
.num_cpu_pages
));
380 if (adev
->gart
.pages
== NULL
)
388 * amdgpu_gart_fini - tear down the driver info for managing the gart
390 * @adev: amdgpu_device pointer
392 * Tear down the gart driver info and free the dummy page (all asics).
394 void amdgpu_gart_fini(struct amdgpu_device
*adev
)
396 #ifdef CONFIG_DRM_AMDGPU_GART_DEBUGFS
397 vfree(adev
->gart
.pages
);
398 adev
->gart
.pages
= NULL
;
400 amdgpu_gart_dummy_page_fini(adev
);