1 // SPDX-License-Identifier: GPL-2.0
/*
 * cacheinfo support - processor cache information via sysfs
 *
 * Based on arch/x86/kernel/cpu/intel_cacheinfo.c
 * Author: Sudeep Holla <sudeep.holla@arm.com>
 */
8 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
10 #include <linux/acpi.h>
11 #include <linux/bitops.h>
12 #include <linux/cacheinfo.h>
13 #include <linux/compiler.h>
14 #include <linux/cpu.h>
15 #include <linux/device.h>
16 #include <linux/init.h>
18 #include <linux/sched.h>
19 #include <linux/slab.h>
20 #include <linux/smp.h>
21 #include <linux/sysfs.h>
23 /* pointer to per cpu cacheinfo */
24 static DEFINE_PER_CPU(struct cpu_cacheinfo
, ci_cpu_cacheinfo
);
25 #define ci_cacheinfo(cpu) (&per_cpu(ci_cpu_cacheinfo, cpu))
26 #define cache_leaves(cpu) (ci_cacheinfo(cpu)->num_leaves)
27 #define per_cpu_cacheinfo(cpu) (ci_cacheinfo(cpu)->info_list)
28 #define per_cpu_cacheinfo_idx(cpu, idx) \
29 (per_cpu_cacheinfo(cpu) + (idx))
31 /* Set if no cache information is found in DT/ACPI. */
32 static bool use_arch_info
;
34 struct cpu_cacheinfo
*get_cpu_cacheinfo(unsigned int cpu
)
36 return ci_cacheinfo(cpu
);
39 static inline bool cache_leaves_are_shared(struct cacheinfo
*this_leaf
,
40 struct cacheinfo
*sib_leaf
)
43 * For non DT/ACPI systems, assume unique level 1 caches,
44 * system-wide shared caches for all other levels.
46 if (!(IS_ENABLED(CONFIG_OF
) || IS_ENABLED(CONFIG_ACPI
)) ||
48 return (this_leaf
->level
!= 1) && (sib_leaf
->level
!= 1);
50 if ((sib_leaf
->attributes
& CACHE_ID
) &&
51 (this_leaf
->attributes
& CACHE_ID
))
52 return sib_leaf
->id
== this_leaf
->id
;
54 return sib_leaf
->fw_token
== this_leaf
->fw_token
;
57 bool last_level_cache_is_valid(unsigned int cpu
)
59 struct cacheinfo
*llc
;
61 if (!cache_leaves(cpu
))
64 llc
= per_cpu_cacheinfo_idx(cpu
, cache_leaves(cpu
) - 1);
66 return (llc
->attributes
& CACHE_ID
) || !!llc
->fw_token
;
70 bool last_level_cache_is_shared(unsigned int cpu_x
, unsigned int cpu_y
)
72 struct cacheinfo
*llc_x
, *llc_y
;
74 if (!last_level_cache_is_valid(cpu_x
) ||
75 !last_level_cache_is_valid(cpu_y
))
78 llc_x
= per_cpu_cacheinfo_idx(cpu_x
, cache_leaves(cpu_x
) - 1);
79 llc_y
= per_cpu_cacheinfo_idx(cpu_y
, cache_leaves(cpu_y
) - 1);
81 return cache_leaves_are_shared(llc_x
, llc_y
);
86 static bool of_check_cache_nodes(struct device_node
*np
);
/*
 * Names of the OF (device tree) properties that are queried for one
 * kind of cache.
 */
struct cache_type_info {
	/* property holding the cache size */
	const char *size_prop;
	/* candidate properties for the line size, tried in array order */
	const char *line_size_props[2];
	/* property holding the number of sets */
	const char *nr_sets_prop;
};
95 static const struct cache_type_info cache_type_info
[] = {
97 .size_prop
= "cache-size",
98 .line_size_props
= { "cache-line-size",
99 "cache-block-size", },
100 .nr_sets_prop
= "cache-sets",
102 .size_prop
= "i-cache-size",
103 .line_size_props
= { "i-cache-line-size",
104 "i-cache-block-size", },
105 .nr_sets_prop
= "i-cache-sets",
107 .size_prop
= "d-cache-size",
108 .line_size_props
= { "d-cache-line-size",
109 "d-cache-block-size", },
110 .nr_sets_prop
= "d-cache-sets",
114 static inline int get_cacheinfo_idx(enum cache_type type
)
116 if (type
== CACHE_TYPE_UNIFIED
)
121 static void cache_size(struct cacheinfo
*this_leaf
, struct device_node
*np
)
123 const char *propname
;
126 ct_idx
= get_cacheinfo_idx(this_leaf
->type
);
127 propname
= cache_type_info
[ct_idx
].size_prop
;
129 of_property_read_u32(np
, propname
, &this_leaf
->size
);
132 /* not cache_line_size() because that's a macro in include/linux/cache.h */
133 static void cache_get_line_size(struct cacheinfo
*this_leaf
,
134 struct device_node
*np
)
138 ct_idx
= get_cacheinfo_idx(this_leaf
->type
);
139 lim
= ARRAY_SIZE(cache_type_info
[ct_idx
].line_size_props
);
141 for (i
= 0; i
< lim
; i
++) {
144 const char *propname
;
146 propname
= cache_type_info
[ct_idx
].line_size_props
[i
];
147 ret
= of_property_read_u32(np
, propname
, &line_size
);
149 this_leaf
->coherency_line_size
= line_size
;
155 static void cache_nr_sets(struct cacheinfo
*this_leaf
, struct device_node
*np
)
157 const char *propname
;
160 ct_idx
= get_cacheinfo_idx(this_leaf
->type
);
161 propname
= cache_type_info
[ct_idx
].nr_sets_prop
;
163 of_property_read_u32(np
, propname
, &this_leaf
->number_of_sets
);
166 static void cache_associativity(struct cacheinfo
*this_leaf
)
168 unsigned int line_size
= this_leaf
->coherency_line_size
;
169 unsigned int nr_sets
= this_leaf
->number_of_sets
;
170 unsigned int size
= this_leaf
->size
;
173 * If the cache is fully associative, there is no need to
174 * check the other properties.
176 if (!(nr_sets
== 1) && (nr_sets
> 0 && size
> 0 && line_size
> 0))
177 this_leaf
->ways_of_associativity
= (size
/ nr_sets
) / line_size
;
180 static bool cache_node_is_unified(struct cacheinfo
*this_leaf
,
181 struct device_node
*np
)
183 return of_property_read_bool(np
, "cache-unified");
186 static void cache_of_set_props(struct cacheinfo
*this_leaf
,
187 struct device_node
*np
)
190 * init_cache_level must setup the cache level correctly
191 * overriding the architecturally specified levels, so
192 * if type is NONE at this stage, it should be unified
194 if (this_leaf
->type
== CACHE_TYPE_NOCACHE
&&
195 cache_node_is_unified(this_leaf
, np
))
196 this_leaf
->type
= CACHE_TYPE_UNIFIED
;
197 cache_size(this_leaf
, np
);
198 cache_get_line_size(this_leaf
, np
);
199 cache_nr_sets(this_leaf
, np
);
200 cache_associativity(this_leaf
);
203 static int cache_setup_of_node(unsigned int cpu
)
205 struct cacheinfo
*this_leaf
;
206 unsigned int index
= 0;
208 struct device_node
*np
__free(device_node
) = of_cpu_device_node_get(cpu
);
210 pr_err("Failed to find cpu%d device node\n", cpu
);
214 if (!of_check_cache_nodes(np
)) {
218 while (index
< cache_leaves(cpu
)) {
219 this_leaf
= per_cpu_cacheinfo_idx(cpu
, index
);
220 if (this_leaf
->level
!= 1) {
221 struct device_node
*prev
__free(device_node
) = np
;
222 np
= of_find_next_cache_node(np
);
226 cache_of_set_props(this_leaf
, np
);
227 this_leaf
->fw_token
= np
;
231 if (index
!= cache_leaves(cpu
)) /* not all OF nodes populated */
237 static bool of_check_cache_nodes(struct device_node
*np
)
239 if (of_property_present(np
, "cache-size") ||
240 of_property_present(np
, "i-cache-size") ||
241 of_property_present(np
, "d-cache-size") ||
242 of_property_present(np
, "cache-unified"))
245 struct device_node
*next
__free(device_node
) = of_find_next_cache_node(np
);
253 static int of_count_cache_leaves(struct device_node
*np
)
255 unsigned int leaves
= 0;
257 if (of_property_read_bool(np
, "cache-size"))
259 if (of_property_read_bool(np
, "i-cache-size"))
261 if (of_property_read_bool(np
, "d-cache-size"))
265 /* The '[i-|d-|]cache-size' property is required, but
266 * if absent, fallback on the 'cache-unified' property.
268 if (of_property_read_bool(np
, "cache-unified"))
277 int init_of_cache_level(unsigned int cpu
)
279 struct cpu_cacheinfo
*this_cpu_ci
= get_cpu_cacheinfo(cpu
);
280 struct device_node
*np
__free(device_node
) = of_cpu_device_node_get(cpu
);
281 unsigned int levels
= 0, leaves
, level
;
283 if (!of_check_cache_nodes(np
)) {
287 leaves
= of_count_cache_leaves(np
);
292 struct device_node
*prev
__free(device_node
) = np
;
293 np
= of_find_next_cache_node(np
);
297 if (!of_device_is_compatible(np
, "cache"))
299 if (of_property_read_u32(np
, "cache-level", &level
))
304 leaves
+= of_count_cache_leaves(np
);
308 this_cpu_ci
->num_levels
= levels
;
309 this_cpu_ci
->num_leaves
= leaves
;
/*
 * No-op variant of cache_setup_of_node(): always reports success.
 * NOTE(review): presumably the fallback for builds without CONFIG_OF; the
 * preprocessor guard is not visible in the reviewed copy.
 */
static inline int cache_setup_of_node(unsigned int cpu)
{
	return 0;
}
/*
 * No-op variant of init_of_cache_level(): always reports success.
 * NOTE(review): presumably the fallback for builds without CONFIG_OF; the
 * preprocessor guard is not visible in the reviewed copy.
 */
int init_of_cache_level(unsigned int cpu)
{
	return 0;
}
319 int __weak
cache_setup_acpi(unsigned int cpu
)
324 unsigned int coherency_max_size
;
326 static int cache_setup_properties(unsigned int cpu
)
330 if (of_have_populated_dt())
331 ret
= cache_setup_of_node(cpu
);
332 else if (!acpi_disabled
)
333 ret
= cache_setup_acpi(cpu
);
335 // Assume there is no cache information available in DT/ACPI from now.
336 if (ret
&& use_arch_cache_info())
337 use_arch_info
= true;
342 static int cache_shared_cpu_map_setup(unsigned int cpu
)
344 struct cpu_cacheinfo
*this_cpu_ci
= get_cpu_cacheinfo(cpu
);
345 struct cacheinfo
*this_leaf
, *sib_leaf
;
346 unsigned int index
, sib_index
;
349 if (this_cpu_ci
->cpu_map_populated
)
353 * skip setting up cache properties if LLC is valid, just need
354 * to update the shared cpu_map if the cache attributes were
355 * populated early before all the cpus are brought online
357 if (!last_level_cache_is_valid(cpu
) && !use_arch_info
) {
358 ret
= cache_setup_properties(cpu
);
363 for (index
= 0; index
< cache_leaves(cpu
); index
++) {
366 this_leaf
= per_cpu_cacheinfo_idx(cpu
, index
);
368 cpumask_set_cpu(cpu
, &this_leaf
->shared_cpu_map
);
369 for_each_online_cpu(i
) {
370 struct cpu_cacheinfo
*sib_cpu_ci
= get_cpu_cacheinfo(i
);
372 if (i
== cpu
|| !sib_cpu_ci
->info_list
)
373 continue;/* skip if itself or no cacheinfo */
374 for (sib_index
= 0; sib_index
< cache_leaves(i
); sib_index
++) {
375 sib_leaf
= per_cpu_cacheinfo_idx(i
, sib_index
);
378 * Comparing cache IDs only makes sense if the leaves
379 * belong to the same cache level of same type. Skip
380 * the check if level and type do not match.
382 if (sib_leaf
->level
!= this_leaf
->level
||
383 sib_leaf
->type
!= this_leaf
->type
)
386 if (cache_leaves_are_shared(this_leaf
, sib_leaf
)) {
387 cpumask_set_cpu(cpu
, &sib_leaf
->shared_cpu_map
);
388 cpumask_set_cpu(i
, &this_leaf
->shared_cpu_map
);
393 /* record the maximum cache line size */
394 if (this_leaf
->coherency_line_size
> coherency_max_size
)
395 coherency_max_size
= this_leaf
->coherency_line_size
;
398 /* shared_cpu_map is now populated for the cpu */
399 this_cpu_ci
->cpu_map_populated
= true;
403 static void cache_shared_cpu_map_remove(unsigned int cpu
)
405 struct cpu_cacheinfo
*this_cpu_ci
= get_cpu_cacheinfo(cpu
);
406 struct cacheinfo
*this_leaf
, *sib_leaf
;
407 unsigned int sibling
, index
, sib_index
;
409 for (index
= 0; index
< cache_leaves(cpu
); index
++) {
410 this_leaf
= per_cpu_cacheinfo_idx(cpu
, index
);
411 for_each_cpu(sibling
, &this_leaf
->shared_cpu_map
) {
412 struct cpu_cacheinfo
*sib_cpu_ci
=
413 get_cpu_cacheinfo(sibling
);
415 if (sibling
== cpu
|| !sib_cpu_ci
->info_list
)
416 continue;/* skip if itself or no cacheinfo */
418 for (sib_index
= 0; sib_index
< cache_leaves(sibling
); sib_index
++) {
419 sib_leaf
= per_cpu_cacheinfo_idx(sibling
, sib_index
);
422 * Comparing cache IDs only makes sense if the leaves
423 * belong to the same cache level of same type. Skip
424 * the check if level and type do not match.
426 if (sib_leaf
->level
!= this_leaf
->level
||
427 sib_leaf
->type
!= this_leaf
->type
)
430 if (cache_leaves_are_shared(this_leaf
, sib_leaf
)) {
431 cpumask_clear_cpu(cpu
, &sib_leaf
->shared_cpu_map
);
432 cpumask_clear_cpu(sibling
, &this_leaf
->shared_cpu_map
);
439 /* cpu is no longer populated in the shared map */
440 this_cpu_ci
->cpu_map_populated
= false;
/*
 * Drop @cpu from the shared_cpu_map of the leaves it shares with other
 * CPUs. Does nothing when no cacheinfo array exists for @cpu.
 */
static void free_cache_attributes(unsigned int cpu)
{
	if (per_cpu_cacheinfo(cpu))
		cache_shared_cpu_map_remove(cpu);
}
451 int __weak
early_cache_level(unsigned int cpu
)
456 int __weak
init_cache_level(unsigned int cpu
)
461 int __weak
populate_cache_leaves(unsigned int cpu
)
467 int allocate_cache_info(int cpu
)
469 per_cpu_cacheinfo(cpu
) = kcalloc(cache_leaves(cpu
),
470 sizeof(struct cacheinfo
), GFP_ATOMIC
);
471 if (!per_cpu_cacheinfo(cpu
)) {
472 cache_leaves(cpu
) = 0;
479 int fetch_cache_info(unsigned int cpu
)
481 struct cpu_cacheinfo
*this_cpu_ci
= get_cpu_cacheinfo(cpu
);
482 unsigned int levels
= 0, split_levels
= 0;
486 ret
= init_of_cache_level(cpu
);
488 ret
= acpi_get_cache_info(cpu
, &levels
, &split_levels
);
490 this_cpu_ci
->num_levels
= levels
;
493 * - there cannot be any split caches (data/instruction)
494 * above a unified cache
495 * - data/instruction caches come by pair
497 this_cpu_ci
->num_leaves
= levels
+ split_levels
;
501 if (ret
|| !cache_leaves(cpu
)) {
502 ret
= early_cache_level(cpu
);
506 if (!cache_leaves(cpu
))
509 this_cpu_ci
->early_ci_levels
= true;
512 return allocate_cache_info(cpu
);
515 static inline int init_level_allocate_ci(unsigned int cpu
)
517 unsigned int early_leaves
= cache_leaves(cpu
);
519 /* Since early initialization/allocation of the cacheinfo is allowed
520 * via fetch_cache_info() and this also gets called as CPU hotplug
521 * callbacks via cacheinfo_cpu_online, the init/alloc can be skipped
522 * as it will happen only once (the cacheinfo memory is never freed).
523 * Just populate the cacheinfo. However, if the cacheinfo has been
524 * allocated early through the arch-specific early_cache_level() call,
525 * there is a chance the info is wrong (this can happen on arm64). In
526 * that case, call init_cache_level() anyway to give the arch-specific
527 * code a chance to make things right.
529 if (per_cpu_cacheinfo(cpu
) && !ci_cacheinfo(cpu
)->early_ci_levels
)
532 if (init_cache_level(cpu
) || !cache_leaves(cpu
))
536 * Now that we have properly initialized the cache level info, make
537 * sure we don't try to do that again the next time we are called
538 * (e.g. as CPU hotplug callbacks).
540 ci_cacheinfo(cpu
)->early_ci_levels
= false;
542 if (cache_leaves(cpu
) <= early_leaves
)
545 kfree(per_cpu_cacheinfo(cpu
));
546 return allocate_cache_info(cpu
);
549 int detect_cache_attributes(unsigned int cpu
)
553 ret
= init_level_allocate_ci(cpu
);
558 * If LLC is valid the cache leaves were already populated so just go to
559 * update the cpu map.
561 if (!last_level_cache_is_valid(cpu
)) {
563 * populate_cache_leaves() may completely setup the cache leaves and
564 * shared_cpu_map or it may leave it partially setup.
566 ret
= populate_cache_leaves(cpu
);
572 * For systems using DT for cache hierarchy, fw_token
573 * and shared_cpu_map will be set up here only if they are
574 * not populated already
576 ret
= cache_shared_cpu_map_setup(cpu
);
578 pr_warn("Unable to detect cache hierarchy for CPU %d\n", cpu
);
585 free_cache_attributes(cpu
);
589 /* pointer to cpuX/cache device */
590 static DEFINE_PER_CPU(struct device
*, ci_cache_dev
);
591 #define per_cpu_cache_dev(cpu) (per_cpu(ci_cache_dev, cpu))
593 static cpumask_t cache_dev_map
;
595 /* pointer to array of devices for cpuX/cache/indexY */
596 static DEFINE_PER_CPU(struct device
**, ci_index_dev
);
597 #define per_cpu_index_dev(cpu) (per_cpu(ci_index_dev, cpu))
598 #define per_cache_index_dev(cpu, idx) ((per_cpu_index_dev(cpu))[idx])
/*
 * Generate a sysfs show routine named <file_name>_show that prints the
 * unsigned cacheinfo field <object> of the leaf stored as the device's
 * driver data, followed by a newline.
 */
#define show_one(file_name, object)				\
static ssize_t file_name##_show(struct device *dev,		\
		struct device_attribute *attr, char *buf)	\
{								\
	const struct cacheinfo *leaf = dev_get_drvdata(dev);	\
								\
	return sysfs_emit(buf, "%u\n", leaf->object);		\
}
609 show_one(level
, level
);
610 show_one(coherency_line_size
, coherency_line_size
);
611 show_one(number_of_sets
, number_of_sets
);
612 show_one(physical_line_partition
, physical_line_partition
);
613 show_one(ways_of_associativity
, ways_of_associativity
);
615 static ssize_t
size_show(struct device
*dev
,
616 struct device_attribute
*attr
, char *buf
)
618 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
620 return sysfs_emit(buf
, "%uK\n", this_leaf
->size
>> 10);
623 static ssize_t
shared_cpu_map_show(struct device
*dev
,
624 struct device_attribute
*attr
, char *buf
)
626 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
627 const struct cpumask
*mask
= &this_leaf
->shared_cpu_map
;
629 return sysfs_emit(buf
, "%*pb\n", nr_cpu_ids
, mask
);
632 static ssize_t
shared_cpu_list_show(struct device
*dev
,
633 struct device_attribute
*attr
, char *buf
)
635 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
636 const struct cpumask
*mask
= &this_leaf
->shared_cpu_map
;
638 return sysfs_emit(buf
, "%*pbl\n", nr_cpu_ids
, mask
);
641 static ssize_t
type_show(struct device
*dev
,
642 struct device_attribute
*attr
, char *buf
)
644 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
647 switch (this_leaf
->type
) {
648 case CACHE_TYPE_DATA
:
651 case CACHE_TYPE_INST
:
652 output
= "Instruction";
654 case CACHE_TYPE_UNIFIED
:
661 return sysfs_emit(buf
, "%s\n", output
);
664 static ssize_t
allocation_policy_show(struct device
*dev
,
665 struct device_attribute
*attr
, char *buf
)
667 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
668 unsigned int ci_attr
= this_leaf
->attributes
;
671 if ((ci_attr
& CACHE_READ_ALLOCATE
) && (ci_attr
& CACHE_WRITE_ALLOCATE
))
672 output
= "ReadWriteAllocate";
673 else if (ci_attr
& CACHE_READ_ALLOCATE
)
674 output
= "ReadAllocate";
675 else if (ci_attr
& CACHE_WRITE_ALLOCATE
)
676 output
= "WriteAllocate";
680 return sysfs_emit(buf
, "%s\n", output
);
683 static ssize_t
write_policy_show(struct device
*dev
,
684 struct device_attribute
*attr
, char *buf
)
686 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
687 unsigned int ci_attr
= this_leaf
->attributes
;
690 if (ci_attr
& CACHE_WRITE_THROUGH
)
691 n
= sysfs_emit(buf
, "WriteThrough\n");
692 else if (ci_attr
& CACHE_WRITE_BACK
)
693 n
= sysfs_emit(buf
, "WriteBack\n");
697 static DEVICE_ATTR_RO(id
);
698 static DEVICE_ATTR_RO(level
);
699 static DEVICE_ATTR_RO(type
);
700 static DEVICE_ATTR_RO(coherency_line_size
);
701 static DEVICE_ATTR_RO(ways_of_associativity
);
702 static DEVICE_ATTR_RO(number_of_sets
);
703 static DEVICE_ATTR_RO(size
);
704 static DEVICE_ATTR_RO(allocation_policy
);
705 static DEVICE_ATTR_RO(write_policy
);
706 static DEVICE_ATTR_RO(shared_cpu_map
);
707 static DEVICE_ATTR_RO(shared_cpu_list
);
708 static DEVICE_ATTR_RO(physical_line_partition
);
710 static struct attribute
*cache_default_attrs
[] = {
713 &dev_attr_level
.attr
,
714 &dev_attr_shared_cpu_map
.attr
,
715 &dev_attr_shared_cpu_list
.attr
,
716 &dev_attr_coherency_line_size
.attr
,
717 &dev_attr_ways_of_associativity
.attr
,
718 &dev_attr_number_of_sets
.attr
,
720 &dev_attr_allocation_policy
.attr
,
721 &dev_attr_write_policy
.attr
,
722 &dev_attr_physical_line_partition
.attr
,
727 cache_default_attrs_is_visible(struct kobject
*kobj
,
728 struct attribute
*attr
, int unused
)
730 struct device
*dev
= kobj_to_dev(kobj
);
731 struct cacheinfo
*this_leaf
= dev_get_drvdata(dev
);
732 const struct cpumask
*mask
= &this_leaf
->shared_cpu_map
;
733 umode_t mode
= attr
->mode
;
735 if ((attr
== &dev_attr_id
.attr
) && (this_leaf
->attributes
& CACHE_ID
))
737 if ((attr
== &dev_attr_type
.attr
) && this_leaf
->type
)
739 if ((attr
== &dev_attr_level
.attr
) && this_leaf
->level
)
741 if ((attr
== &dev_attr_shared_cpu_map
.attr
) && !cpumask_empty(mask
))
743 if ((attr
== &dev_attr_shared_cpu_list
.attr
) && !cpumask_empty(mask
))
745 if ((attr
== &dev_attr_coherency_line_size
.attr
) &&
746 this_leaf
->coherency_line_size
)
748 if ((attr
== &dev_attr_ways_of_associativity
.attr
) &&
749 this_leaf
->size
) /* allow 0 = full associativity */
751 if ((attr
== &dev_attr_number_of_sets
.attr
) &&
752 this_leaf
->number_of_sets
)
754 if ((attr
== &dev_attr_size
.attr
) && this_leaf
->size
)
756 if ((attr
== &dev_attr_write_policy
.attr
) &&
757 (this_leaf
->attributes
& CACHE_WRITE_POLICY_MASK
))
759 if ((attr
== &dev_attr_allocation_policy
.attr
) &&
760 (this_leaf
->attributes
& CACHE_ALLOCATE_POLICY_MASK
))
762 if ((attr
== &dev_attr_physical_line_partition
.attr
) &&
763 this_leaf
->physical_line_partition
)
769 static const struct attribute_group cache_default_group
= {
770 .attrs
= cache_default_attrs
,
771 .is_visible
= cache_default_attrs_is_visible
,
774 static const struct attribute_group
*cache_default_groups
[] = {
775 &cache_default_group
,
779 static const struct attribute_group
*cache_private_groups
[] = {
780 &cache_default_group
,
781 NULL
, /* Place holder for private group */
785 const struct attribute_group
*
786 __weak
cache_get_priv_group(struct cacheinfo
*this_leaf
)
791 static const struct attribute_group
**
792 cache_get_attribute_groups(struct cacheinfo
*this_leaf
)
794 const struct attribute_group
*priv_group
=
795 cache_get_priv_group(this_leaf
);
798 return cache_default_groups
;
800 if (!cache_private_groups
[1])
801 cache_private_groups
[1] = priv_group
;
803 return cache_private_groups
;
806 /* Add/Remove cache interface for CPU device */
807 static void cpu_cache_sysfs_exit(unsigned int cpu
)
810 struct device
*ci_dev
;
812 if (per_cpu_index_dev(cpu
)) {
813 for (i
= 0; i
< cache_leaves(cpu
); i
++) {
814 ci_dev
= per_cache_index_dev(cpu
, i
);
817 device_unregister(ci_dev
);
819 kfree(per_cpu_index_dev(cpu
));
820 per_cpu_index_dev(cpu
) = NULL
;
822 device_unregister(per_cpu_cache_dev(cpu
));
823 per_cpu_cache_dev(cpu
) = NULL
;
826 static int cpu_cache_sysfs_init(unsigned int cpu
)
828 struct device
*dev
= get_cpu_device(cpu
);
830 if (per_cpu_cacheinfo(cpu
) == NULL
)
833 per_cpu_cache_dev(cpu
) = cpu_device_create(dev
, NULL
, NULL
, "cache");
834 if (IS_ERR(per_cpu_cache_dev(cpu
)))
835 return PTR_ERR(per_cpu_cache_dev(cpu
));
837 /* Allocate all required memory */
838 per_cpu_index_dev(cpu
) = kcalloc(cache_leaves(cpu
),
839 sizeof(struct device
*), GFP_KERNEL
);
840 if (unlikely(per_cpu_index_dev(cpu
) == NULL
))
846 cpu_cache_sysfs_exit(cpu
);
850 static int cache_add_dev(unsigned int cpu
)
854 struct device
*ci_dev
, *parent
;
855 struct cacheinfo
*this_leaf
;
856 const struct attribute_group
**cache_groups
;
858 rc
= cpu_cache_sysfs_init(cpu
);
859 if (unlikely(rc
< 0))
862 parent
= per_cpu_cache_dev(cpu
);
863 for (i
= 0; i
< cache_leaves(cpu
); i
++) {
864 this_leaf
= per_cpu_cacheinfo_idx(cpu
, i
);
865 if (this_leaf
->disable_sysfs
)
867 if (this_leaf
->type
== CACHE_TYPE_NOCACHE
)
869 cache_groups
= cache_get_attribute_groups(this_leaf
);
870 ci_dev
= cpu_device_create(parent
, this_leaf
, cache_groups
,
872 if (IS_ERR(ci_dev
)) {
873 rc
= PTR_ERR(ci_dev
);
876 per_cache_index_dev(cpu
, i
) = ci_dev
;
878 cpumask_set_cpu(cpu
, &cache_dev_map
);
882 cpu_cache_sysfs_exit(cpu
);
886 static unsigned int cpu_map_shared_cache(bool online
, unsigned int cpu
,
889 struct cacheinfo
*llc
, *sib_llc
;
890 unsigned int sibling
;
892 if (!last_level_cache_is_valid(cpu
))
895 llc
= per_cpu_cacheinfo_idx(cpu
, cache_leaves(cpu
) - 1);
897 if (llc
->type
!= CACHE_TYPE_DATA
&& llc
->type
!= CACHE_TYPE_UNIFIED
)
901 *map
= &llc
->shared_cpu_map
;
902 return cpumask_weight(*map
);
905 /* shared_cpu_map of offlined CPU will be cleared, so use sibling map */
906 for_each_cpu(sibling
, &llc
->shared_cpu_map
) {
907 if (sibling
== cpu
|| !last_level_cache_is_valid(sibling
))
909 sib_llc
= per_cpu_cacheinfo_idx(sibling
, cache_leaves(sibling
) - 1);
910 *map
= &sib_llc
->shared_cpu_map
;
911 return cpumask_weight(*map
);
918 * Calculate the size of the per-CPU data cache slice. This can be
919 * used to estimate the size of the data cache slice that can be used
920 * by one CPU under ideal circumstances. UNIFIED caches are counted
921 * in addition to DATA caches. So, please consider code cache usage
922 * when use the result.
924 * Because the cache inclusive/non-inclusive information isn't
925 * available, we just use the size of the per-CPU slice of LLC to make
926 * the result more predictable across architectures.
928 static void update_per_cpu_data_slice_size_cpu(unsigned int cpu
)
930 struct cpu_cacheinfo
*ci
;
931 struct cacheinfo
*llc
;
932 unsigned int nr_shared
;
934 if (!last_level_cache_is_valid(cpu
))
937 ci
= ci_cacheinfo(cpu
);
938 llc
= per_cpu_cacheinfo_idx(cpu
, cache_leaves(cpu
) - 1);
940 if (llc
->type
!= CACHE_TYPE_DATA
&& llc
->type
!= CACHE_TYPE_UNIFIED
)
943 nr_shared
= cpumask_weight(&llc
->shared_cpu_map
);
945 ci
->per_cpu_data_slice_size
= llc
->size
/ nr_shared
;
948 static void update_per_cpu_data_slice_size(bool cpu_online
, unsigned int cpu
,
953 for_each_cpu(icpu
, cpu_map
) {
954 if (!cpu_online
&& icpu
== cpu
)
956 update_per_cpu_data_slice_size_cpu(icpu
);
957 setup_pcp_cacheinfo(icpu
);
961 static int cacheinfo_cpu_online(unsigned int cpu
)
963 int rc
= detect_cache_attributes(cpu
);
968 rc
= cache_add_dev(cpu
);
971 if (cpu_map_shared_cache(true, cpu
, &cpu_map
))
972 update_per_cpu_data_slice_size(true, cpu
, cpu_map
);
975 free_cache_attributes(cpu
);
979 static int cacheinfo_cpu_pre_down(unsigned int cpu
)
982 unsigned int nr_shared
;
984 nr_shared
= cpu_map_shared_cache(false, cpu
, &cpu_map
);
985 if (cpumask_test_and_clear_cpu(cpu
, &cache_dev_map
))
986 cpu_cache_sysfs_exit(cpu
);
988 free_cache_attributes(cpu
);
990 update_per_cpu_data_slice_size(false, cpu
, cpu_map
);
994 static int __init
cacheinfo_sysfs_init(void)
996 return cpuhp_setup_state(CPUHP_AP_BASE_CACHEINFO_ONLINE
,
997 "base/cacheinfo:online",
998 cacheinfo_cpu_online
, cacheinfo_cpu_pre_down
);
1000 device_initcall(cacheinfo_sysfs_init
);