/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 */
29 #include <drm/radeon_drm.h>
/*
 * The GART (Graphics Aperture Remapping Table) is an aperture
 * in the GPU's address space.  System pages can be mapped into
 * the aperture and look like contiguous pages from the GPU's
 * perspective.  A page table maps the pages in the aperture
 * to the actual backing pages in system memory.
 *
 * Radeon GPUs support both an internal GART, as described above,
 * and AGP.  AGP works similarly, but the GART table is configured
 * and maintained by the northbridge rather than the driver.
 * Radeon hw has a separate AGP aperture that is programmed to
 * point to the AGP aperture provided by the northbridge and the
 * requests are passed through to the northbridge aperture.
 * Both AGP and internal GART can be used at the same time, however
 * that is not currently supported by the driver.
 *
 * This file handles the common internal GART management.
 */
/*
 * Common GART table functions.
 */
56 * radeon_gart_table_ram_alloc - allocate system ram for gart page table
58 * @rdev: radeon_device pointer
60 * Allocate system memory for GART page table
61 * (r1xx-r3xx, non-pcie r4xx, rs400). These asics require the
62 * gart table to be in system memory.
63 * Returns 0 for success, -ENOMEM for failure.
65 int radeon_gart_table_ram_alloc(struct radeon_device
*rdev
)
69 ptr
= pci_alloc_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
70 &rdev
->gart
.table_addr
);
75 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
76 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
77 set_memory_uc((unsigned long)ptr
,
78 rdev
->gart
.table_size
>> PAGE_SHIFT
);
82 memset((void *)rdev
->gart
.ptr
, 0, rdev
->gart
.table_size
);
87 * radeon_gart_table_ram_free - free system ram for gart page table
89 * @rdev: radeon_device pointer
91 * Free system memory for GART page table
92 * (r1xx-r3xx, non-pcie r4xx, rs400). These asics require the
93 * gart table to be in system memory.
95 void radeon_gart_table_ram_free(struct radeon_device
*rdev
)
97 if (rdev
->gart
.ptr
== NULL
) {
101 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
102 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
103 set_memory_wb((unsigned long)rdev
->gart
.ptr
,
104 rdev
->gart
.table_size
>> PAGE_SHIFT
);
107 pci_free_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
108 (void *)rdev
->gart
.ptr
,
109 rdev
->gart
.table_addr
);
110 rdev
->gart
.ptr
= NULL
;
111 rdev
->gart
.table_addr
= 0;
115 * radeon_gart_table_vram_alloc - allocate vram for gart page table
117 * @rdev: radeon_device pointer
119 * Allocate video memory for GART page table
120 * (pcie r4xx, r5xx+). These asics require the
121 * gart table to be in video memory.
122 * Returns 0 for success, error for failure.
124 int radeon_gart_table_vram_alloc(struct radeon_device
*rdev
)
128 if (rdev
->gart
.robj
== NULL
) {
129 r
= radeon_bo_create(rdev
, rdev
->gart
.table_size
,
130 PAGE_SIZE
, true, RADEON_GEM_DOMAIN_VRAM
,
131 0, NULL
, NULL
, &rdev
->gart
.robj
);
140 * radeon_gart_table_vram_pin - pin gart page table in vram
142 * @rdev: radeon_device pointer
144 * Pin the GART page table in vram so it will not be moved
145 * by the memory manager (pcie r4xx, r5xx+). These asics require the
146 * gart table to be in video memory.
147 * Returns 0 for success, error for failure.
149 int radeon_gart_table_vram_pin(struct radeon_device
*rdev
)
154 r
= radeon_bo_reserve(rdev
->gart
.robj
, false);
155 if (unlikely(r
!= 0))
157 r
= radeon_bo_pin(rdev
->gart
.robj
,
158 RADEON_GEM_DOMAIN_VRAM
, &gpu_addr
);
160 radeon_bo_unreserve(rdev
->gart
.robj
);
163 r
= radeon_bo_kmap(rdev
->gart
.robj
, &rdev
->gart
.ptr
);
165 radeon_bo_unpin(rdev
->gart
.robj
);
166 radeon_bo_unreserve(rdev
->gart
.robj
);
167 rdev
->gart
.table_addr
= gpu_addr
;
172 /* We might have dropped some GART table updates while it wasn't
173 * mapped, restore all entries
175 for (i
= 0; i
< rdev
->gart
.num_gpu_pages
; i
++)
176 radeon_gart_set_page(rdev
, i
, rdev
->gart
.pages_entry
[i
]);
178 radeon_gart_tlb_flush(rdev
);
185 * radeon_gart_table_vram_unpin - unpin gart page table in vram
187 * @rdev: radeon_device pointer
189 * Unpin the GART page table in vram (pcie r4xx, r5xx+).
190 * These asics require the gart table to be in video memory.
192 void radeon_gart_table_vram_unpin(struct radeon_device
*rdev
)
196 if (rdev
->gart
.robj
== NULL
) {
199 r
= radeon_bo_reserve(rdev
->gart
.robj
, false);
200 if (likely(r
== 0)) {
201 radeon_bo_kunmap(rdev
->gart
.robj
);
202 radeon_bo_unpin(rdev
->gart
.robj
);
203 radeon_bo_unreserve(rdev
->gart
.robj
);
204 rdev
->gart
.ptr
= NULL
;
209 * radeon_gart_table_vram_free - free gart page table vram
211 * @rdev: radeon_device pointer
213 * Free the video memory used for the GART page table
214 * (pcie r4xx, r5xx+). These asics require the gart table to
215 * be in video memory.
217 void radeon_gart_table_vram_free(struct radeon_device
*rdev
)
219 if (rdev
->gart
.robj
== NULL
) {
222 radeon_bo_unref(&rdev
->gart
.robj
);
/*
 * Common gart functions.
 */
229 * radeon_gart_unbind - unbind pages from the gart page table
231 * @rdev: radeon_device pointer
232 * @offset: offset into the GPU's gart aperture
233 * @pages: number of pages to unbind
235 * Unbinds the requested pages from the gart page table and
236 * replaces them with the dummy page (all asics).
238 void radeon_gart_unbind(struct radeon_device
*rdev
, unsigned offset
,
245 if (!rdev
->gart
.ready
) {
246 WARN(1, "trying to unbind memory from uninitialized GART !\n");
249 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
250 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
251 for (i
= 0; i
< pages
; i
++, p
++) {
252 if (rdev
->gart
.pages
[p
]) {
253 rdev
->gart
.pages
[p
] = NULL
;
254 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
255 rdev
->gart
.pages_entry
[t
] = rdev
->dummy_page
.entry
;
256 if (rdev
->gart
.ptr
) {
257 radeon_gart_set_page(rdev
, t
,
258 rdev
->dummy_page
.entry
);
263 if (rdev
->gart
.ptr
) {
265 radeon_gart_tlb_flush(rdev
);
270 * radeon_gart_bind - bind pages into the gart page table
272 * @rdev: radeon_device pointer
273 * @offset: offset into the GPU's gart aperture
274 * @pages: number of pages to bind
275 * @pagelist: pages to bind
276 * @dma_addr: DMA addresses of pages
277 * @flags: RADEON_GART_PAGE_* flags
279 * Binds the requested pages to the gart page table
281 * Returns 0 for success, -EINVAL for failure.
283 int radeon_gart_bind(struct radeon_device
*rdev
, unsigned offset
,
284 int pages
, struct page
**pagelist
, dma_addr_t
*dma_addr
,
289 uint64_t page_base
, page_entry
;
292 if (!rdev
->gart
.ready
) {
293 WARN(1, "trying to bind memory to uninitialized GART !\n");
296 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
297 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
299 for (i
= 0; i
< pages
; i
++, p
++) {
300 rdev
->gart
.pages
[p
] = pagelist
[i
];
301 page_base
= dma_addr
[i
];
302 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
303 page_entry
= radeon_gart_get_page_entry(page_base
, flags
);
304 rdev
->gart
.pages_entry
[t
] = page_entry
;
305 if (rdev
->gart
.ptr
) {
306 radeon_gart_set_page(rdev
, t
, page_entry
);
308 page_base
+= RADEON_GPU_PAGE_SIZE
;
311 if (rdev
->gart
.ptr
) {
313 radeon_gart_tlb_flush(rdev
);
319 * radeon_gart_init - init the driver info for managing the gart
321 * @rdev: radeon_device pointer
323 * Allocate the dummy page and init the gart driver info (all asics).
324 * Returns 0 for success, error for failure.
326 int radeon_gart_init(struct radeon_device
*rdev
)
330 if (rdev
->gart
.pages
) {
333 /* We need PAGE_SIZE >= RADEON_GPU_PAGE_SIZE */
334 if (PAGE_SIZE
< RADEON_GPU_PAGE_SIZE
) {
335 DRM_ERROR("Page size is smaller than GPU page size!\n");
338 r
= radeon_dummy_page_init(rdev
);
341 /* Compute table size */
342 rdev
->gart
.num_cpu_pages
= rdev
->mc
.gtt_size
/ PAGE_SIZE
;
343 rdev
->gart
.num_gpu_pages
= rdev
->mc
.gtt_size
/ RADEON_GPU_PAGE_SIZE
;
344 DRM_INFO("GART: num cpu pages %u, num gpu pages %u\n",
345 rdev
->gart
.num_cpu_pages
, rdev
->gart
.num_gpu_pages
);
346 /* Allocate pages table */
347 rdev
->gart
.pages
= vzalloc(sizeof(void *) * rdev
->gart
.num_cpu_pages
);
348 if (rdev
->gart
.pages
== NULL
) {
349 radeon_gart_fini(rdev
);
352 rdev
->gart
.pages_entry
= vmalloc(sizeof(uint64_t) *
353 rdev
->gart
.num_gpu_pages
);
354 if (rdev
->gart
.pages_entry
== NULL
) {
355 radeon_gart_fini(rdev
);
358 /* set GART entry to point to the dummy page by default */
359 for (i
= 0; i
< rdev
->gart
.num_gpu_pages
; i
++)
360 rdev
->gart
.pages_entry
[i
] = rdev
->dummy_page
.entry
;
365 * radeon_gart_fini - tear down the driver info for managing the gart
367 * @rdev: radeon_device pointer
369 * Tear down the gart driver info and free the dummy page (all asics).
371 void radeon_gart_fini(struct radeon_device
*rdev
)
373 if (rdev
->gart
.ready
) {
375 radeon_gart_unbind(rdev
, 0, rdev
->gart
.num_cpu_pages
);
377 rdev
->gart
.ready
= false;
378 vfree(rdev
->gart
.pages
);
379 vfree(rdev
->gart
.pages_entry
);
380 rdev
->gart
.pages
= NULL
;
381 rdev
->gart
.pages_entry
= NULL
;
383 radeon_dummy_page_fini(rdev
);