2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
24 * Authors: Dave Airlie
29 #include <drm/radeon_drm.h>
31 #include <asm/set_memory.h>
/*
 * The GART (Graphics Aperture Remapping Table) is an aperture
 * in the GPU's address space.  System pages can be mapped into
 * the aperture and look like contiguous pages from the GPU's
 * perspective.  A page table maps the pages in the aperture
 * to the actual backing pages in system memory.
 *
 * Radeon GPUs support both an internal GART, as described above,
 * and AGP.  AGP works similarly, but the GART table is configured
 * and maintained by the northbridge rather than the driver.
 * Radeon hw has a separate AGP aperture that is programmed to
 * point to the AGP aperture provided by the northbridge and the
 * requests are passed through to the northbridge aperture.
 * Both AGP and internal GART can be used at the same time, however
 * that is not currently supported by the driver.
 *
 * This file handles the common internal GART management.
 */
/*
 * Common GART table functions.
 */
59 * radeon_gart_table_ram_alloc - allocate system ram for gart page table
61 * @rdev: radeon_device pointer
63 * Allocate system memory for GART page table
64 * (r1xx-r3xx, non-pcie r4xx, rs400). These asics require the
65 * gart table to be in system memory.
66 * Returns 0 for success, -ENOMEM for failure.
68 int radeon_gart_table_ram_alloc(struct radeon_device
*rdev
)
72 ptr
= pci_alloc_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
73 &rdev
->gart
.table_addr
);
78 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
79 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
80 set_memory_uc((unsigned long)ptr
,
81 rdev
->gart
.table_size
>> PAGE_SHIFT
);
85 memset((void *)rdev
->gart
.ptr
, 0, rdev
->gart
.table_size
);
90 * radeon_gart_table_ram_free - free system ram for gart page table
92 * @rdev: radeon_device pointer
94 * Free system memory for GART page table
95 * (r1xx-r3xx, non-pcie r4xx, rs400). These asics require the
96 * gart table to be in system memory.
98 void radeon_gart_table_ram_free(struct radeon_device
*rdev
)
100 if (rdev
->gart
.ptr
== NULL
) {
104 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
105 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
106 set_memory_wb((unsigned long)rdev
->gart
.ptr
,
107 rdev
->gart
.table_size
>> PAGE_SHIFT
);
110 pci_free_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
111 (void *)rdev
->gart
.ptr
,
112 rdev
->gart
.table_addr
);
113 rdev
->gart
.ptr
= NULL
;
114 rdev
->gart
.table_addr
= 0;
118 * radeon_gart_table_vram_alloc - allocate vram for gart page table
120 * @rdev: radeon_device pointer
122 * Allocate video memory for GART page table
123 * (pcie r4xx, r5xx+). These asics require the
124 * gart table to be in video memory.
125 * Returns 0 for success, error for failure.
127 int radeon_gart_table_vram_alloc(struct radeon_device
*rdev
)
131 if (rdev
->gart
.robj
== NULL
) {
132 r
= radeon_bo_create(rdev
, rdev
->gart
.table_size
,
133 PAGE_SIZE
, true, RADEON_GEM_DOMAIN_VRAM
,
134 0, NULL
, NULL
, &rdev
->gart
.robj
);
143 * radeon_gart_table_vram_pin - pin gart page table in vram
145 * @rdev: radeon_device pointer
147 * Pin the GART page table in vram so it will not be moved
148 * by the memory manager (pcie r4xx, r5xx+). These asics require the
149 * gart table to be in video memory.
150 * Returns 0 for success, error for failure.
152 int radeon_gart_table_vram_pin(struct radeon_device
*rdev
)
157 r
= radeon_bo_reserve(rdev
->gart
.robj
, false);
158 if (unlikely(r
!= 0))
160 r
= radeon_bo_pin(rdev
->gart
.robj
,
161 RADEON_GEM_DOMAIN_VRAM
, &gpu_addr
);
163 radeon_bo_unreserve(rdev
->gart
.robj
);
166 r
= radeon_bo_kmap(rdev
->gart
.robj
, &rdev
->gart
.ptr
);
168 radeon_bo_unpin(rdev
->gart
.robj
);
169 radeon_bo_unreserve(rdev
->gart
.robj
);
170 rdev
->gart
.table_addr
= gpu_addr
;
175 /* We might have dropped some GART table updates while it wasn't
176 * mapped, restore all entries
178 for (i
= 0; i
< rdev
->gart
.num_gpu_pages
; i
++)
179 radeon_gart_set_page(rdev
, i
, rdev
->gart
.pages_entry
[i
]);
181 radeon_gart_tlb_flush(rdev
);
188 * radeon_gart_table_vram_unpin - unpin gart page table in vram
190 * @rdev: radeon_device pointer
192 * Unpin the GART page table in vram (pcie r4xx, r5xx+).
193 * These asics require the gart table to be in video memory.
195 void radeon_gart_table_vram_unpin(struct radeon_device
*rdev
)
199 if (rdev
->gart
.robj
== NULL
) {
202 r
= radeon_bo_reserve(rdev
->gart
.robj
, false);
203 if (likely(r
== 0)) {
204 radeon_bo_kunmap(rdev
->gart
.robj
);
205 radeon_bo_unpin(rdev
->gart
.robj
);
206 radeon_bo_unreserve(rdev
->gart
.robj
);
207 rdev
->gart
.ptr
= NULL
;
212 * radeon_gart_table_vram_free - free gart page table vram
214 * @rdev: radeon_device pointer
216 * Free the video memory used for the GART page table
217 * (pcie r4xx, r5xx+). These asics require the gart table to
218 * be in video memory.
220 void radeon_gart_table_vram_free(struct radeon_device
*rdev
)
222 if (rdev
->gart
.robj
== NULL
) {
225 radeon_bo_unref(&rdev
->gart
.robj
);
/*
 * Common gart functions.
 */
232 * radeon_gart_unbind - unbind pages from the gart page table
234 * @rdev: radeon_device pointer
235 * @offset: offset into the GPU's gart aperture
236 * @pages: number of pages to unbind
238 * Unbinds the requested pages from the gart page table and
239 * replaces them with the dummy page (all asics).
241 void radeon_gart_unbind(struct radeon_device
*rdev
, unsigned offset
,
248 if (!rdev
->gart
.ready
) {
249 WARN(1, "trying to unbind memory from uninitialized GART !\n");
252 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
253 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
254 for (i
= 0; i
< pages
; i
++, p
++) {
255 if (rdev
->gart
.pages
[p
]) {
256 rdev
->gart
.pages
[p
] = NULL
;
257 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
258 rdev
->gart
.pages_entry
[t
] = rdev
->dummy_page
.entry
;
259 if (rdev
->gart
.ptr
) {
260 radeon_gart_set_page(rdev
, t
,
261 rdev
->dummy_page
.entry
);
266 if (rdev
->gart
.ptr
) {
268 radeon_gart_tlb_flush(rdev
);
273 * radeon_gart_bind - bind pages into the gart page table
275 * @rdev: radeon_device pointer
276 * @offset: offset into the GPU's gart aperture
277 * @pages: number of pages to bind
278 * @pagelist: pages to bind
279 * @dma_addr: DMA addresses of pages
280 * @flags: RADEON_GART_PAGE_* flags
282 * Binds the requested pages to the gart page table
284 * Returns 0 for success, -EINVAL for failure.
286 int radeon_gart_bind(struct radeon_device
*rdev
, unsigned offset
,
287 int pages
, struct page
**pagelist
, dma_addr_t
*dma_addr
,
292 uint64_t page_base
, page_entry
;
295 if (!rdev
->gart
.ready
) {
296 WARN(1, "trying to bind memory to uninitialized GART !\n");
299 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
300 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
302 for (i
= 0; i
< pages
; i
++, p
++) {
303 rdev
->gart
.pages
[p
] = pagelist
[i
];
304 page_base
= dma_addr
[i
];
305 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
306 page_entry
= radeon_gart_get_page_entry(page_base
, flags
);
307 rdev
->gart
.pages_entry
[t
] = page_entry
;
308 if (rdev
->gart
.ptr
) {
309 radeon_gart_set_page(rdev
, t
, page_entry
);
311 page_base
+= RADEON_GPU_PAGE_SIZE
;
314 if (rdev
->gart
.ptr
) {
316 radeon_gart_tlb_flush(rdev
);
322 * radeon_gart_init - init the driver info for managing the gart
324 * @rdev: radeon_device pointer
326 * Allocate the dummy page and init the gart driver info (all asics).
327 * Returns 0 for success, error for failure.
329 int radeon_gart_init(struct radeon_device
*rdev
)
333 if (rdev
->gart
.pages
) {
336 /* We need PAGE_SIZE >= RADEON_GPU_PAGE_SIZE */
337 if (PAGE_SIZE
< RADEON_GPU_PAGE_SIZE
) {
338 DRM_ERROR("Page size is smaller than GPU page size!\n");
341 r
= radeon_dummy_page_init(rdev
);
344 /* Compute table size */
345 rdev
->gart
.num_cpu_pages
= rdev
->mc
.gtt_size
/ PAGE_SIZE
;
346 rdev
->gart
.num_gpu_pages
= rdev
->mc
.gtt_size
/ RADEON_GPU_PAGE_SIZE
;
347 DRM_INFO("GART: num cpu pages %u, num gpu pages %u\n",
348 rdev
->gart
.num_cpu_pages
, rdev
->gart
.num_gpu_pages
);
349 /* Allocate pages table */
350 rdev
->gart
.pages
= vzalloc(array_size(sizeof(void *),
351 rdev
->gart
.num_cpu_pages
));
352 if (rdev
->gart
.pages
== NULL
) {
353 radeon_gart_fini(rdev
);
356 rdev
->gart
.pages_entry
= vmalloc(array_size(sizeof(uint64_t),
357 rdev
->gart
.num_gpu_pages
));
358 if (rdev
->gart
.pages_entry
== NULL
) {
359 radeon_gart_fini(rdev
);
362 /* set GART entry to point to the dummy page by default */
363 for (i
= 0; i
< rdev
->gart
.num_gpu_pages
; i
++)
364 rdev
->gart
.pages_entry
[i
] = rdev
->dummy_page
.entry
;
369 * radeon_gart_fini - tear down the driver info for managing the gart
371 * @rdev: radeon_device pointer
373 * Tear down the gart driver info and free the dummy page (all asics).
375 void radeon_gart_fini(struct radeon_device
*rdev
)
377 if (rdev
->gart
.ready
) {
379 radeon_gart_unbind(rdev
, 0, rdev
->gart
.num_cpu_pages
);
381 rdev
->gart
.ready
= false;
382 vfree(rdev
->gart
.pages
);
383 vfree(rdev
->gart
.pages_entry
);
384 rdev
->gart
.pages
= NULL
;
385 rdev
->gart
.pages_entry
= NULL
;
387 radeon_dummy_page_fini(rdev
);