/*
 * Cell Broadband Engine OProfile Support
 *
 * (C) Copyright IBM Corporation 2006
 *
 * Author: Maynard Johnson <maynardj@us.ibm.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
/* The code in this source file is responsible for generating
 * vma-to-fileOffset maps for both overlay and non-overlay SPU
 * applications.
 */
#include <linux/string.h>
#include <linux/uaccess.h>
#include <linux/elf.h>
#include <linux/slab.h>
26 void vma_map_free(struct vma_to_fileoffset_map
*map
)
29 struct vma_to_fileoffset_map
*next
= map
->next
;
36 vma_map_lookup(struct vma_to_fileoffset_map
*map
, unsigned int vma
,
37 const struct spu
*aSpu
, int *grd_val
)
40 * Default the offset to the physical address + a flag value.
41 * Addresses of dynamically generated code can't be found in the vma
42 * map. For those addresses the flagged value will be sent on to
43 * the user space tools so they can be reported rather than just
46 u32 offset
= 0x10000000 + vma
;
49 for (; map
; map
= map
->next
) {
50 if (vma
< map
->vma
|| vma
>= map
->vma
+ map
->size
)
54 ovly_grd
= *(u32
*)(aSpu
->local_store
+ map
->guard_ptr
);
55 if (ovly_grd
!= map
->guard_val
)
59 offset
= vma
- map
->vma
+ map
->offset
;
66 static struct vma_to_fileoffset_map
*
67 vma_map_add(struct vma_to_fileoffset_map
*map
, unsigned int vma
,
68 unsigned int size
, unsigned int offset
, unsigned int guard_ptr
,
69 unsigned int guard_val
)
71 struct vma_to_fileoffset_map
*new =
72 kzalloc(sizeof(struct vma_to_fileoffset_map
), GFP_KERNEL
);
74 printk(KERN_ERR
"SPU_PROF: %s, line %d: malloc failed\n",
75 __FUNCTION__
, __LINE__
);
84 new->guard_ptr
= guard_ptr
;
85 new->guard_val
= guard_val
;
91 /* Parse SPE ELF header and generate a list of vma_maps.
92 * A pointer to the first vma_map in the generated list
93 * of vma_maps is returned. */
94 struct vma_to_fileoffset_map
*create_vma_map(const struct spu
*aSpu
,
95 unsigned long spu_elf_start
)
97 static const unsigned char expected
[EI_PAD
] = {
102 [EI_CLASS
] = ELFCLASS32
,
103 [EI_DATA
] = ELFDATA2MSB
,
104 [EI_VERSION
] = EV_CURRENT
,
105 [EI_OSABI
] = ELFOSABI_NONE
109 struct vma_to_fileoffset_map
*map
= NULL
;
110 struct spu_overlay_info ovly
;
111 unsigned int overlay_tbl_offset
= -1;
112 unsigned long phdr_start
, shdr_start
;
115 Elf32_Shdr shdr
, shdr_str
;
120 unsigned int ovly_table_sym
= 0;
121 unsigned int ovly_buf_table_sym
= 0;
122 unsigned int ovly_table_end_sym
= 0;
123 unsigned int ovly_buf_table_end_sym
= 0;
124 unsigned long ovly_table
;
125 unsigned int n_ovlys
;
127 /* Get and validate ELF header. */
129 if (copy_from_user(&ehdr
, (void *) spu_elf_start
, sizeof (ehdr
)))
132 if (memcmp(ehdr
.e_ident
, expected
, EI_PAD
) != 0) {
133 printk(KERN_ERR
"SPU_PROF: "
134 "%s, line %d: Unexpected e_ident parsing SPU ELF\n",
135 __FUNCTION__
, __LINE__
);
138 if (ehdr
.e_machine
!= EM_SPU
) {
139 printk(KERN_ERR
"SPU_PROF: "
140 "%s, line %d: Unexpected e_machine parsing SPU ELF\n",
141 __FUNCTION__
, __LINE__
);
144 if (ehdr
.e_type
!= ET_EXEC
) {
145 printk(KERN_ERR
"SPU_PROF: "
146 "%s, line %d: Unexpected e_type parsing SPU ELF\n",
147 __FUNCTION__
, __LINE__
);
150 phdr_start
= spu_elf_start
+ ehdr
.e_phoff
;
151 shdr_start
= spu_elf_start
+ ehdr
.e_shoff
;
153 /* Traverse program headers. */
154 for (i
= 0; i
< ehdr
.e_phnum
; i
++) {
155 if (copy_from_user(&phdr
,
156 (void *) (phdr_start
+ i
* sizeof(phdr
)),
160 if (phdr
.p_type
!= PT_LOAD
)
162 if (phdr
.p_flags
& (1 << 27))
165 map
= vma_map_add(map
, phdr
.p_vaddr
, phdr
.p_memsz
,
166 phdr
.p_offset
, 0, 0);
171 pr_debug("SPU_PROF: Created non-overlay maps\n");
172 /* Traverse section table and search for overlay-related symbols. */
173 for (i
= 0; i
< ehdr
.e_shnum
; i
++) {
174 if (copy_from_user(&shdr
,
175 (void *) (shdr_start
+ i
* sizeof(shdr
)),
179 if (shdr
.sh_type
!= SHT_SYMTAB
)
181 if (shdr
.sh_entsize
!= sizeof (sym
))
184 if (copy_from_user(&shdr_str
,
185 (void *) (shdr_start
+ shdr
.sh_link
*
190 if (shdr_str
.sh_type
!= SHT_STRTAB
)
193 for (j
= 0; j
< shdr
.sh_size
/ sizeof (sym
); j
++) {
194 if (copy_from_user(&sym
, (void *) (spu_elf_start
+
200 if (copy_from_user(name
, (void *)
201 (spu_elf_start
+ shdr_str
.sh_offset
+
206 if (memcmp(name
, "_ovly_table", 12) == 0)
207 ovly_table_sym
= sym
.st_value
;
208 if (memcmp(name
, "_ovly_buf_table", 16) == 0)
209 ovly_buf_table_sym
= sym
.st_value
;
210 if (memcmp(name
, "_ovly_table_end", 16) == 0)
211 ovly_table_end_sym
= sym
.st_value
;
212 if (memcmp(name
, "_ovly_buf_table_end", 20) == 0)
213 ovly_buf_table_end_sym
= sym
.st_value
;
217 /* If we don't have overlays, we're done. */
218 if (ovly_table_sym
== 0 || ovly_buf_table_sym
== 0
219 || ovly_table_end_sym
== 0 || ovly_buf_table_end_sym
== 0) {
220 pr_debug("SPU_PROF: No overlay table found\n");
223 pr_debug("SPU_PROF: Overlay table found\n");
226 /* The _ovly_table symbol represents a table with one entry
227 * per overlay section. The _ovly_buf_table symbol represents
228 * a table with one entry per overlay region.
229 * The struct spu_overlay_info gives the structure of the _ovly_table
230 * entries. The structure of _ovly_table_buf is simply one
231 * u32 word per entry.
233 overlay_tbl_offset
= vma_map_lookup(map
, ovly_table_sym
,
235 if (overlay_tbl_offset
< 0) {
236 printk(KERN_ERR
"SPU_PROF: "
237 "%s, line %d: Error finding SPU overlay table\n",
238 __FUNCTION__
, __LINE__
);
241 ovly_table
= spu_elf_start
+ overlay_tbl_offset
;
243 n_ovlys
= (ovly_table_end_sym
-
244 ovly_table_sym
) / sizeof (ovly
);
246 /* Traverse overlay table. */
247 for (i
= 0; i
< n_ovlys
; i
++) {
248 if (copy_from_user(&ovly
, (void *)
249 (ovly_table
+ i
* sizeof (ovly
)),
253 /* The ovly.vma/size/offset arguments are analogous to the same
254 * arguments used above for non-overlay maps. The final two
255 * args are referred to as the guard pointer and the guard
257 * The guard pointer is an entry in the _ovly_buf_table,
258 * computed using ovly.buf as the index into the table. Since
259 * ovly.buf values begin at '1' to reference the first (or 0th)
260 * entry in the _ovly_buf_table, the computation subtracts 1
262 * The guard value is stored in the _ovly_buf_table entry and
263 * is an index (starting at 1) back to the _ovly_table entry
264 * that is pointing at this _ovly_buf_table entry. So, for
265 * example, for an overlay scenario with one overlay segment
266 * and two overlay sections:
267 * - Section 1 points to the first entry of the
268 * _ovly_buf_table, which contains a guard value
269 * of '1', referencing the first (index=0) entry of
271 * - Section 2 points to the second entry of the
272 * _ovly_buf_table, which contains a guard value
273 * of '2', referencing the second (index=1) entry of
276 map
= vma_map_add(map
, ovly
.vma
, ovly
.size
, ovly
.offset
,
277 ovly_buf_table_sym
+ (ovly
.buf
-1) * 4, i
+1);