2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
24 * Authors: Dave Airlie
29 #include "radeon_drm.h"
31 #include "radeon_reg.h"
34 * Common GART table functions.
36 int radeon_gart_table_ram_alloc(struct radeon_device
*rdev
)
40 ptr
= pci_alloc_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
41 &rdev
->gart
.table_addr
);
46 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
47 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
48 set_memory_uc((unsigned long)ptr
,
49 rdev
->gart
.table_size
>> PAGE_SHIFT
);
52 rdev
->gart
.table
.ram
.ptr
= ptr
;
53 memset((void *)rdev
->gart
.table
.ram
.ptr
, 0, rdev
->gart
.table_size
);
57 void radeon_gart_table_ram_free(struct radeon_device
*rdev
)
59 if (rdev
->gart
.table
.ram
.ptr
== NULL
) {
63 if (rdev
->family
== CHIP_RS400
|| rdev
->family
== CHIP_RS480
||
64 rdev
->family
== CHIP_RS690
|| rdev
->family
== CHIP_RS740
) {
65 set_memory_wb((unsigned long)rdev
->gart
.table
.ram
.ptr
,
66 rdev
->gart
.table_size
>> PAGE_SHIFT
);
69 pci_free_consistent(rdev
->pdev
, rdev
->gart
.table_size
,
70 (void *)rdev
->gart
.table
.ram
.ptr
,
71 rdev
->gart
.table_addr
);
72 rdev
->gart
.table
.ram
.ptr
= NULL
;
73 rdev
->gart
.table_addr
= 0;
76 int radeon_gart_table_vram_alloc(struct radeon_device
*rdev
)
80 if (rdev
->gart
.table
.vram
.robj
== NULL
) {
81 r
= radeon_bo_create(rdev
, NULL
, rdev
->gart
.table_size
,
82 true, RADEON_GEM_DOMAIN_VRAM
,
83 &rdev
->gart
.table
.vram
.robj
);
91 int radeon_gart_table_vram_pin(struct radeon_device
*rdev
)
96 r
= radeon_bo_reserve(rdev
->gart
.table
.vram
.robj
, false);
99 r
= radeon_bo_pin(rdev
->gart
.table
.vram
.robj
,
100 RADEON_GEM_DOMAIN_VRAM
, &gpu_addr
);
102 radeon_bo_unreserve(rdev
->gart
.table
.vram
.robj
);
105 r
= radeon_bo_kmap(rdev
->gart
.table
.vram
.robj
,
106 (void **)&rdev
->gart
.table
.vram
.ptr
);
108 radeon_bo_unpin(rdev
->gart
.table
.vram
.robj
);
109 radeon_bo_unreserve(rdev
->gart
.table
.vram
.robj
);
110 rdev
->gart
.table_addr
= gpu_addr
;
114 void radeon_gart_table_vram_free(struct radeon_device
*rdev
)
118 if (rdev
->gart
.table
.vram
.robj
== NULL
) {
121 r
= radeon_bo_reserve(rdev
->gart
.table
.vram
.robj
, false);
122 if (likely(r
== 0)) {
123 radeon_bo_kunmap(rdev
->gart
.table
.vram
.robj
);
124 radeon_bo_unpin(rdev
->gart
.table
.vram
.robj
);
125 radeon_bo_unreserve(rdev
->gart
.table
.vram
.robj
);
127 radeon_bo_unref(&rdev
->gart
.table
.vram
.robj
);
134 * Common gart functions.
136 void radeon_gart_unbind(struct radeon_device
*rdev
, unsigned offset
,
144 if (!rdev
->gart
.ready
) {
145 WARN(1, "trying to unbind memory to unitialized GART !\n");
148 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
149 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
150 for (i
= 0; i
< pages
; i
++, p
++) {
151 if (rdev
->gart
.pages
[p
]) {
152 pci_unmap_page(rdev
->pdev
, rdev
->gart
.pages_addr
[p
],
153 PAGE_SIZE
, PCI_DMA_BIDIRECTIONAL
);
154 rdev
->gart
.pages
[p
] = NULL
;
155 rdev
->gart
.pages_addr
[p
] = rdev
->dummy_page
.addr
;
156 page_base
= rdev
->gart
.pages_addr
[p
];
157 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
158 radeon_gart_set_page(rdev
, t
, page_base
);
159 page_base
+= RADEON_GPU_PAGE_SIZE
;
164 radeon_gart_tlb_flush(rdev
);
167 int radeon_gart_bind(struct radeon_device
*rdev
, unsigned offset
,
168 int pages
, struct page
**pagelist
)
175 if (!rdev
->gart
.ready
) {
176 DRM_ERROR("trying to bind memory to unitialized GART !\n");
179 t
= offset
/ RADEON_GPU_PAGE_SIZE
;
180 p
= t
/ (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
);
182 for (i
= 0; i
< pages
; i
++, p
++) {
183 /* we need to support large memory configurations */
184 /* assume that unbind have already been call on the range */
185 rdev
->gart
.pages_addr
[p
] = pci_map_page(rdev
->pdev
, pagelist
[i
],
187 PCI_DMA_BIDIRECTIONAL
);
188 if (pci_dma_mapping_error(rdev
->pdev
, rdev
->gart
.pages_addr
[p
])) {
189 /* FIXME: failed to map page (return -ENOMEM?) */
190 radeon_gart_unbind(rdev
, offset
, pages
);
193 rdev
->gart
.pages
[p
] = pagelist
[i
];
194 page_base
= rdev
->gart
.pages_addr
[p
];
195 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
196 radeon_gart_set_page(rdev
, t
, page_base
);
197 page_base
+= RADEON_GPU_PAGE_SIZE
;
201 radeon_gart_tlb_flush(rdev
);
205 void radeon_gart_restore(struct radeon_device
*rdev
)
210 for (i
= 0, t
= 0; i
< rdev
->gart
.num_cpu_pages
; i
++) {
211 page_base
= rdev
->gart
.pages_addr
[i
];
212 for (j
= 0; j
< (PAGE_SIZE
/ RADEON_GPU_PAGE_SIZE
); j
++, t
++) {
213 radeon_gart_set_page(rdev
, t
, page_base
);
214 page_base
+= RADEON_GPU_PAGE_SIZE
;
218 radeon_gart_tlb_flush(rdev
);
221 int radeon_gart_init(struct radeon_device
*rdev
)
225 if (rdev
->gart
.pages
) {
228 /* We need PAGE_SIZE >= RADEON_GPU_PAGE_SIZE */
229 if (PAGE_SIZE
< RADEON_GPU_PAGE_SIZE
) {
230 DRM_ERROR("Page size is smaller than GPU page size!\n");
233 r
= radeon_dummy_page_init(rdev
);
236 /* Compute table size */
237 rdev
->gart
.num_cpu_pages
= rdev
->mc
.gtt_size
/ PAGE_SIZE
;
238 rdev
->gart
.num_gpu_pages
= rdev
->mc
.gtt_size
/ RADEON_GPU_PAGE_SIZE
;
239 DRM_INFO("GART: num cpu pages %u, num gpu pages %u\n",
240 rdev
->gart
.num_cpu_pages
, rdev
->gart
.num_gpu_pages
);
241 /* Allocate pages table */
242 rdev
->gart
.pages
= kzalloc(sizeof(void *) * rdev
->gart
.num_cpu_pages
,
244 if (rdev
->gart
.pages
== NULL
) {
245 radeon_gart_fini(rdev
);
248 rdev
->gart
.pages_addr
= kzalloc(sizeof(dma_addr_t
) *
249 rdev
->gart
.num_cpu_pages
, GFP_KERNEL
);
250 if (rdev
->gart
.pages_addr
== NULL
) {
251 radeon_gart_fini(rdev
);
254 /* set GART entry to point to the dummy page by default */
255 for (i
= 0; i
< rdev
->gart
.num_cpu_pages
; i
++) {
256 rdev
->gart
.pages_addr
[i
] = rdev
->dummy_page
.addr
;
261 void radeon_gart_fini(struct radeon_device
*rdev
)
263 if (rdev
->gart
.pages
&& rdev
->gart
.pages_addr
&& rdev
->gart
.ready
) {
265 radeon_gart_unbind(rdev
, 0, rdev
->gart
.num_cpu_pages
);
267 rdev
->gart
.ready
= false;
268 kfree(rdev
->gart
.pages
);
269 kfree(rdev
->gart
.pages_addr
);
270 rdev
->gart
.pages
= NULL
;
271 rdev
->gart
.pages_addr
= NULL
;