/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 */
#include <linux/errno.h>
#include <linux/types.h>
#include <asm/barrier.h>
#include <drm/radeon_drm.h>
/*
 * The GART (Graphics Aperture Remapping Table) is an aperture
 * in the GPU's address space.  System pages can be mapped into
 * the aperture and look like contiguous pages from the GPU's
 * perspective.  A page table maps the pages in the aperture
 * to the actual backing pages in system memory.
 *
 * Radeon GPUs support both an internal GART, as described above,
 * and AGP.  AGP works similarly, but the GART table is configured
 * and maintained by the northbridge rather than the driver.
 * Radeon hw has a separate AGP aperture that is programmed to
 * point to the AGP aperture provided by the northbridge and the
 * requests are passed through to the northbridge aperture.
 * Both AGP and internal GART can be used at the same time, however
 * that is not currently supported by the driver.
 *
 * This file handles the common internal GART management.
 */

/*
 * Common GART table functions.
 */
56 * radeon_gart_table_ram_alloc - allocate system ram for gart page table
58 * @rdev: radeon_device pointer
60 * Allocate system memory for GART page table
61 * (r1xx-r3xx, non-pcie r4xx, rs400). These asics require the
62 * gart table to be in system memory.
63 * Returns 0 for success, -ENOMEM for failure.
65 int radeon_gart_table_ram_alloc(struct radeon_device
*rdev
)
69 ptr
= pci_alloc_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
70 &rdev
->gart
.table_addr
);
75 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
76 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
77 set_memory_uc((unsigned long)ptr
,
78 rdev
->gart
.table_size
>> PAGE_SHIFT
);
82 memset((void *)rdev
->gart
.ptr
, 0, rdev
->gart
.table_size
);
87 * radeon_gart_table_ram_free - free system ram for gart page table
89 * @rdev: radeon_device pointer
91 * Free system memory for GART page table
92 * (r1xx-r3xx, non-pcie r4xx, rs400). These asics require the
93 * gart table to be in system memory.
95 void radeon_gart_table_ram_free(struct radeon_device
*rdev
)
97 if (rdev
->gart
.ptr
== NULL
) {
101 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
102 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
103 set_memory_wb((unsigned long)rdev
->gart
.ptr
,
104 rdev
->gart
.table_size
>> PAGE_SHIFT
);
107 pci_free_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
108 (void *)rdev
->gart
.ptr
,
109 rdev
->gart
.table_addr
);
110 rdev
->gart
.ptr
= NULL
;
111 rdev
->gart
.table_addr
= 0;
115 * radeon_gart_table_vram_alloc - allocate vram for gart page table
117 * @rdev: radeon_device pointer
119 * Allocate video memory for GART page table
120 * (pcie r4xx, r5xx+). These asics require the
121 * gart table to be in video memory.
122 * Returns 0 for success, error for failure.
124 int radeon_gart_table_vram_alloc(struct radeon_device
*rdev
)
128 if (rdev
->gart
.robj
== NULL
) {
129 r
= radeon_bo_create(rdev
, rdev
->gart
.table_size
,
130 PAGE_SIZE
, true, RADEON_GEM_DOMAIN_VRAM
,
131 NULL
, &rdev
->gart
.robj
);
140 * radeon_gart_table_vram_pin - pin gart page table in vram
142 * @rdev: radeon_device pointer
144 * Pin the GART page table in vram so it will not be moved
145 * by the memory manager (pcie r4xx, r5xx+). These asics require the
146 * gart table to be in video memory.
147 * Returns 0 for success, error for failure.
149 int radeon_gart_table_vram_pin(struct radeon_device
*rdev
)
154 r
= radeon_bo_reserve(rdev
->gart
.robj
, false);
155 if (unlikely(r
!= 0))
157 r
= radeon_bo_pin(rdev
->gart
.robj
,
158 RADEON_GEM_DOMAIN_VRAM
, &gpu_addr
);
160 radeon_bo_unreserve(rdev
->gart
.robj
);
163 r
= radeon_bo_kmap(rdev
->gart
.robj
, &rdev
->gart
.ptr
);
165 radeon_bo_unpin(rdev
->gart
.robj
);
166 radeon_bo_unreserve(rdev
->gart
.robj
);
167 rdev
->gart
.table_addr
= gpu_addr
;
172 * radeon_gart_table_vram_unpin - unpin gart page table in vram
174 * @rdev: radeon_device pointer
176 * Unpin the GART page table in vram (pcie r4xx, r5xx+).
177 * These asics require the gart table to be in video memory.
179 void radeon_gart_table_vram_unpin(struct radeon_device
*rdev
)
183 if (rdev
->gart
.robj
== NULL
) {
186 r
= radeon_bo_reserve(rdev
->gart
.robj
, false);
187 if (likely(r
== 0)) {
188 radeon_bo_kunmap(rdev
->gart
.robj
);
189 radeon_bo_unpin(rdev
->gart
.robj
);
190 radeon_bo_unreserve(rdev
->gart
.robj
);
191 rdev
->gart
.ptr
= NULL
;
196 * radeon_gart_table_vram_free - free gart page table vram
198 * @rdev: radeon_device pointer
200 * Free the video memory used for the GART page table
201 * (pcie r4xx, r5xx+). These asics require the gart table to
202 * be in video memory.
204 void radeon_gart_table_vram_free(struct radeon_device
*rdev
)
206 if (rdev
->gart
.robj
== NULL
) {
209 radeon_bo_unref(&rdev
->gart
.robj
);
/*
 * Common gart functions.
 */
216 * radeon_gart_unbind - unbind pages from the gart page table
218 * @rdev: radeon_device pointer
219 * @offset: offset into the GPU's gart aperture
220 * @pages: number of pages to unbind
222 * Unbinds the requested pages from the gart page table and
223 * replaces them with the dummy page (all asics).
225 void radeon_gart_unbind(struct radeon_device
*rdev
, unsigned offset
,
233 if (!rdev
->gart
.ready
) {
234 WARN(1, "trying to unbind memory from uninitialized GART !\n");
237 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
238 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
239 for (i
= 0; i
< pages
; i
++, p
++) {
240 if (rdev
->gart
.pages
[p
]) {
241 rdev
->gart
.pages
[p
] = NULL
;
242 rdev
->gart
.pages_addr
[p
] = rdev
->dummy_page
.addr
;
243 page_base
= rdev
->gart
.pages_addr
[p
];
244 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
245 if (rdev
->gart
.ptr
) {
246 radeon_gart_set_page(rdev
, t
, page_base
);
248 page_base
+= RADEON_GPU_PAGE_SIZE
;
253 radeon_gart_tlb_flush(rdev
);
257 * radeon_gart_bind - bind pages into the gart page table
259 * @rdev: radeon_device pointer
260 * @offset: offset into the GPU's gart aperture
261 * @pages: number of pages to bind
262 * @pagelist: pages to bind
263 * @dma_addr: DMA addresses of pages
265 * Binds the requested pages to the gart page table
267 * Returns 0 for success, -EINVAL for failure.
269 int radeon_gart_bind(struct radeon_device
*rdev
, unsigned offset
,
270 int pages
, struct page
**pagelist
, dma_addr_t
*dma_addr
)
277 if (!rdev
->gart
.ready
) {
278 WARN(1, "trying to bind memory to uninitialized GART !\n");
281 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
282 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
284 for (i
= 0; i
< pages
; i
++, p
++) {
285 rdev
->gart
.pages_addr
[p
] = dma_addr
[i
];
286 rdev
->gart
.pages
[p
] = pagelist
[i
];
287 if (rdev
->gart
.ptr
) {
288 page_base
= rdev
->gart
.pages_addr
[p
];
289 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
290 radeon_gart_set_page(rdev
, t
, page_base
);
291 page_base
+= RADEON_GPU_PAGE_SIZE
;
296 radeon_gart_tlb_flush(rdev
);
301 * radeon_gart_restore - bind all pages in the gart page table
303 * @rdev: radeon_device pointer
305 * Binds all pages in the gart page table (all asics).
306 * Used to rebuild the gart table on device startup or resume.
308 void radeon_gart_restore(struct radeon_device
*rdev
)
313 if (!rdev
->gart
.ptr
) {
316 for (i
= 0, t
= 0; i
< rdev
->gart
.num_cpu_pages
; i
++) {
317 page_base
= rdev
->gart
.pages_addr
[i
];
318 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
319 radeon_gart_set_page(rdev
, t
, page_base
);
320 page_base
+= RADEON_GPU_PAGE_SIZE
;
324 radeon_gart_tlb_flush(rdev
);
328 * radeon_gart_init - init the driver info for managing the gart
330 * @rdev: radeon_device pointer
332 * Allocate the dummy page and init the gart driver info (all asics).
333 * Returns 0 for success, error for failure.
335 int radeon_gart_init(struct radeon_device
*rdev
)
339 if (rdev
->gart
.pages
) {
342 /* We need PAGE_SIZE >= RADEON_GPU_PAGE_SIZE */
343 if (PAGE_SIZE
< RADEON_GPU_PAGE_SIZE
) {
344 DRM_ERROR("Page size is smaller than GPU page size!\n");
347 r
= radeon_dummy_page_init(rdev
);
350 /* Compute table size */
351 rdev
->gart
.num_cpu_pages
= rdev
->mc
.gtt_size
/ PAGE_SIZE
;
352 rdev
->gart
.num_gpu_pages
= rdev
->mc
.gtt_size
/ RADEON_GPU_PAGE_SIZE
;
353 DRM_INFO("GART: num cpu pages %u, num gpu pages %u\n",
354 rdev
->gart
.num_cpu_pages
, rdev
->gart
.num_gpu_pages
);
355 /* Allocate pages table */
356 rdev
->gart
.pages
= vzalloc(sizeof(void *) * rdev
->gart
.num_cpu_pages
);
357 if (rdev
->gart
.pages
== NULL
) {
358 radeon_gart_fini(rdev
);
361 rdev
->gart
.pages_addr
= vzalloc(sizeof(dma_addr_t
) *
362 rdev
->gart
.num_cpu_pages
);
363 if (rdev
->gart
.pages_addr
== NULL
) {
364 radeon_gart_fini(rdev
);
367 /* set GART entry to point to the dummy page by default */
368 for (i
= 0; i
< rdev
->gart
.num_cpu_pages
; i
++) {
369 rdev
->gart
.pages_addr
[i
] = rdev
->dummy_page
.addr
;
375 * radeon_gart_fini - tear down the driver info for managing the gart
377 * @rdev: radeon_device pointer
379 * Tear down the gart driver info and free the dummy page (all asics).
381 void radeon_gart_fini(struct radeon_device
*rdev
)
383 if (rdev
->gart
.pages
&& rdev
->gart
.pages_addr
&& rdev
->gart
.ready
) {
385 radeon_gart_unbind(rdev
, 0, rdev
->gart
.num_cpu_pages
);
387 rdev
->gart
.ready
= false;
388 vfree(rdev
->gart
.pages
);
389 vfree(rdev
->gart
.pages_addr
);
390 rdev
->gart
.pages
= NULL
;
391 rdev
->gart
.pages_addr
= NULL
;
393 radeon_dummy_page_fini(rdev
);