1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright(c) 2022 Intel Corporation. All rights reserved. */
4 #define TRACE_SYSTEM cxl
6 #if !defined(_CXL_EVENTS_H) || defined(TRACE_HEADER_MULTI_READ)
9 #include <linux/tracepoint.h>
10 #include <linux/pci.h>
11 #include <linux/unaligned.h>
17 #define CXL_RAS_UC_CACHE_DATA_PARITY BIT(0)
18 #define CXL_RAS_UC_CACHE_ADDR_PARITY BIT(1)
19 #define CXL_RAS_UC_CACHE_BE_PARITY BIT(2)
20 #define CXL_RAS_UC_CACHE_DATA_ECC BIT(3)
21 #define CXL_RAS_UC_MEM_DATA_PARITY BIT(4)
22 #define CXL_RAS_UC_MEM_ADDR_PARITY BIT(5)
23 #define CXL_RAS_UC_MEM_BE_PARITY BIT(6)
24 #define CXL_RAS_UC_MEM_DATA_ECC BIT(7)
25 #define CXL_RAS_UC_REINIT_THRESH BIT(8)
26 #define CXL_RAS_UC_RSVD_ENCODE BIT(9)
27 #define CXL_RAS_UC_POISON BIT(10)
28 #define CXL_RAS_UC_RECV_OVERFLOW BIT(11)
29 #define CXL_RAS_UC_INTERNAL_ERR BIT(14)
30 #define CXL_RAS_UC_IDE_TX_ERR BIT(15)
31 #define CXL_RAS_UC_IDE_RX_ERR BIT(16)
33 #define show_uc_errs(status) __print_flags(status, " | ", \
34 { CXL_RAS_UC_CACHE_DATA_PARITY, "Cache Data Parity Error" }, \
35 { CXL_RAS_UC_CACHE_ADDR_PARITY, "Cache Address Parity Error" }, \
36 { CXL_RAS_UC_CACHE_BE_PARITY, "Cache Byte Enable Parity Error" }, \
37 { CXL_RAS_UC_CACHE_DATA_ECC, "Cache Data ECC Error" }, \
38 { CXL_RAS_UC_MEM_DATA_PARITY, "Memory Data Parity Error" }, \
39 { CXL_RAS_UC_MEM_ADDR_PARITY, "Memory Address Parity Error" }, \
40 { CXL_RAS_UC_MEM_BE_PARITY, "Memory Byte Enable Parity Error" }, \
41 { CXL_RAS_UC_MEM_DATA_ECC, "Memory Data ECC Error" }, \
42 { CXL_RAS_UC_REINIT_THRESH, "REINIT Threshold Hit" }, \
43 { CXL_RAS_UC_RSVD_ENCODE, "Received Unrecognized Encoding" }, \
44 { CXL_RAS_UC_POISON, "Received Poison From Peer" }, \
45 { CXL_RAS_UC_RECV_OVERFLOW, "Receiver Overflow" }, \
46 { CXL_RAS_UC_INTERNAL_ERR, "Component Specific Error" }, \
47 { CXL_RAS_UC_IDE_TX_ERR, "IDE Tx Error" }, \
48 { CXL_RAS_UC_IDE_RX_ERR, "IDE Rx Error" } \
51 TRACE_EVENT(cxl_aer_uncorrectable_error
,
52 TP_PROTO(const struct cxl_memdev
*cxlmd
, u32 status
, u32 fe
, u32
*hl
),
53 TP_ARGS(cxlmd
, status
, fe
, hl
),
55 __string(memdev
, dev_name(&cxlmd
->dev
))
56 __string(host
, dev_name(cxlmd
->dev
.parent
))
59 __field(u32
, first_error
)
60 __array(u32
, header_log
, CXL_HEADERLOG_SIZE_U32
)
65 __entry
->serial
= cxlmd
->cxlds
->serial
;
66 __entry
->status
= status
;
67 __entry
->first_error
= fe
;
69 * Embed the 512B headerlog data for user app retrieval and
70 * parsing, but no need to print this in the trace buffer.
72 memcpy(__entry
->header_log
, hl
, CXL_HEADERLOG_SIZE
);
74 TP_printk("memdev=%s host=%s serial=%lld: status: '%s' first_error: '%s'",
75 __get_str(memdev
), __get_str(host
), __entry
->serial
,
76 show_uc_errs(__entry
->status
),
77 show_uc_errs(__entry
->first_error
)
/*
 * Correctable RAS error status bits. show_ce_errs() turns a status word
 * built from these bits into a " | "-separated list of error names.
 */
#define CXL_RAS_CE_CACHE_DATA_ECC	BIT(0)
#define CXL_RAS_CE_MEM_DATA_ECC		BIT(1)
#define CXL_RAS_CE_CRC_THRESH		BIT(2)
#define CXL_RAS_CE_RETRY_THRESH		BIT(3)
/*
 * Historical misspelling ("CLX") of CXL_RAS_CE_RETRY_THRESH. Kept as an
 * alias so existing users of the old name continue to build unchanged.
 */
#define CLX_RAS_CE_RETRY_THRESH		CXL_RAS_CE_RETRY_THRESH
#define CXL_RAS_CE_CACHE_POISON		BIT(4)
#define CXL_RAS_CE_MEM_POISON		BIT(5)
#define CXL_RAS_CE_PHYS_LAYER_ERR	BIT(6)
89 #define show_ce_errs(status) __print_flags(status, " | ", \
90 { CXL_RAS_CE_CACHE_DATA_ECC, "Cache Data ECC Error" }, \
91 { CXL_RAS_CE_MEM_DATA_ECC, "Memory Data ECC Error" }, \
92 { CXL_RAS_CE_CRC_THRESH, "CRC Threshold Hit" }, \
93 { CLX_RAS_CE_RETRY_THRESH, "Retry Threshold" }, \
94 { CXL_RAS_CE_CACHE_POISON, "Received Cache Poison From Peer" }, \
95 { CXL_RAS_CE_MEM_POISON, "Received Memory Poison From Peer" }, \
96 { CXL_RAS_CE_PHYS_LAYER_ERR, "Received Error From Physical Layer" } \
99 TRACE_EVENT(cxl_aer_correctable_error
,
100 TP_PROTO(const struct cxl_memdev
*cxlmd
, u32 status
),
101 TP_ARGS(cxlmd
, status
),
103 __string(memdev
, dev_name(&cxlmd
->dev
))
104 __string(host
, dev_name(cxlmd
->dev
.parent
))
109 __assign_str(memdev
);
111 __entry
->serial
= cxlmd
->cxlds
->serial
;
112 __entry
->status
= status
;
114 TP_printk("memdev=%s host=%s serial=%lld: status: '%s'",
115 __get_str(memdev
), __get_str(host
), __entry
->serial
,
116 show_ce_errs(__entry
->status
)
/*
 * Translate an event log identifier (enum cxl_event_log_type) into the
 * label printed after "log=" in the trace output.
 */
#define cxl_event_log_type_str(log_type) __print_symbolic(log_type,	\
	{ CXL_EVENT_TYPE_INFO,	"Informational" },			\
	{ CXL_EVENT_TYPE_WARN,	"Warning" },				\
	{ CXL_EVENT_TYPE_FAIL,	"Failure" },				\
	{ CXL_EVENT_TYPE_FATAL,	"Fatal" }				\
)
127 TRACE_EVENT(cxl_overflow
,
129 TP_PROTO(const struct cxl_memdev
*cxlmd
, enum cxl_event_log_type log
,
130 struct cxl_get_event_payload
*payload
),
132 TP_ARGS(cxlmd
, log
, payload
),
135 __string(memdev
, dev_name(&cxlmd
->dev
))
136 __string(host
, dev_name(cxlmd
->dev
.parent
))
139 __field(u64
, first_ts
)
140 __field(u64
, last_ts
)
145 __assign_str(memdev
);
147 __entry
->serial
= cxlmd
->cxlds
->serial
;
149 __entry
->count
= le16_to_cpu(payload
->overflow_err_count
);
150 __entry
->first_ts
= le64_to_cpu(payload
->first_overflow_timestamp
);
151 __entry
->last_ts
= le64_to_cpu(payload
->last_overflow_timestamp
);
154 TP_printk("memdev=%s host=%s serial=%lld: log=%s : %u records from %llu to %llu",
155 __get_str(memdev
), __get_str(host
), __entry
->serial
,
156 cxl_event_log_type_str(__entry
->log
), __entry
->count
,
157 __entry
->first_ts
, __entry
->last_ts
)
162 * Common Event Record Format
163 * CXL 3.0 section 8.2.9.2.1; Table 8-42
165 #define CXL_EVENT_RECORD_FLAG_PERMANENT BIT(2)
166 #define CXL_EVENT_RECORD_FLAG_MAINT_NEEDED BIT(3)
167 #define CXL_EVENT_RECORD_FLAG_PERF_DEGRADED BIT(4)
168 #define CXL_EVENT_RECORD_FLAG_HW_REPLACE BIT(5)
169 #define show_hdr_flags(flags) __print_flags(flags, " | ", \
170 { CXL_EVENT_RECORD_FLAG_PERMANENT, "PERMANENT_CONDITION" }, \
171 { CXL_EVENT_RECORD_FLAG_MAINT_NEEDED, "MAINTENANCE_NEEDED" }, \
172 { CXL_EVENT_RECORD_FLAG_PERF_DEGRADED, "PERFORMANCE_DEGRADED" }, \
173 { CXL_EVENT_RECORD_FLAG_HW_REPLACE, "HARDWARE_REPLACEMENT_NEEDED" } \
177 * Define macros for the common header of each CXL event.
179 * Tracepoints using these macros must do 3 things:
181 * 1) Add CXL_EVT_TP_entry to TP_STRUCT__entry
182 * 2) Use CXL_EVT_TP_fast_assign within TP_fast_assign;
183 * pass the dev, log, and CXL event header
184 * NOTE: The uuid must be assigned by the specific trace event
185 * 3) Use CXL_EVT_TP_printk() instead of TP_printk()
187 * See the generic_event tracepoint as an example.
189 #define CXL_EVT_TP_entry \
190 __string(memdev, dev_name(&cxlmd->dev)) \
191 __string(host, dev_name(cxlmd->dev.parent)) \
193 __field_struct(uuid_t, hdr_uuid) \
194 __field(u64, serial) \
195 __field(u32, hdr_flags) \
196 __field(u16, hdr_handle) \
197 __field(u16, hdr_related_handle) \
198 __field(u64, hdr_timestamp) \
199 __field(u8, hdr_length) \
200 __field(u8, hdr_maint_op_class)
/*
 * Fill in the common-header part of a CXL event trace entry.
 *
 * @cxlmd:   memdev the event came from; supplies the serial number
 * @evt_log: event log identifier, stored in __entry->log
 * @evt_hdr: common event record header (passed as an lvalue, not a pointer)
 *
 * Multi-byte header fields are converted from little-endian; the 3-byte
 * flags field is read with get_unaligned_le24(). hdr_uuid is NOT written
 * here: each trace event assigns it itself.
 *
 * The expansion is a statement list without a trailing semicolon, so the
 * user terminates it with ';' inside TP_fast_assign().
 */
#define CXL_EVT_TP_fast_assign(cxlmd, evt_log, evt_hdr)				\
	/* device identification */						\
	__assign_str(memdev);							\
	__assign_str(host);							\
	__entry->serial = (cxlmd)->cxlds->serial;				\
	__entry->log = (evt_log);						\
	/* single-byte header fields, copied verbatim */			\
	__entry->hdr_length = (evt_hdr).length;					\
	__entry->hdr_maint_op_class = (evt_hdr).maint_op_class;			\
	/* little-endian header fields */					\
	__entry->hdr_flags = get_unaligned_le24((evt_hdr).flags);		\
	__entry->hdr_handle = le16_to_cpu((evt_hdr).handle);			\
	__entry->hdr_related_handle = le16_to_cpu((evt_hdr).related_handle);	\
	__entry->hdr_timestamp = le64_to_cpu((evt_hdr).timestamp)
214 #define CXL_EVT_TP_printk(fmt, ...) \
215 TP_printk("memdev=%s host=%s serial=%lld log=%s : time=%llu uuid=%pUb " \
216 "len=%d flags='%s' handle=%x related_handle=%x " \
217 "maint_op_class=%u : " fmt, \
218 __get_str(memdev), __get_str(host), __entry->serial, \
219 cxl_event_log_type_str(__entry->log), \
220 __entry->hdr_timestamp, &__entry->hdr_uuid, __entry->hdr_length,\
221 show_hdr_flags(__entry->hdr_flags), __entry->hdr_handle, \
222 __entry->hdr_related_handle, __entry->hdr_maint_op_class, \
225 TRACE_EVENT(cxl_generic_event
,
227 TP_PROTO(const struct cxl_memdev
*cxlmd
, enum cxl_event_log_type log
,
228 const uuid_t
*uuid
, struct cxl_event_generic
*gen_rec
),
230 TP_ARGS(cxlmd
, log
, uuid
, gen_rec
),
234 __array(u8
, data
, CXL_EVENT_RECORD_DATA_LENGTH
)
238 CXL_EVT_TP_fast_assign(cxlmd
, log
, gen_rec
->hdr
);
239 memcpy(&__entry
->hdr_uuid
, uuid
, sizeof(uuid_t
));
240 memcpy(__entry
->data
, gen_rec
->data
, CXL_EVENT_RECORD_DATA_LENGTH
);
243 CXL_EVT_TP_printk("%s",
244 __print_hex(__entry
->data
, CXL_EVENT_RECORD_DATA_LENGTH
))
248 * Physical Address field masks
250 * General Media Event Record
251 * CXL rev 3.0 Section 8.2.9.2.1.1; Table 8-43
254 * CXL rev 3.0 section 8.2.9.2.1.2; Table 8-44
256 #define CXL_DPA_FLAGS_MASK GENMASK(1, 0)
257 #define CXL_DPA_MASK GENMASK_ULL(63, 6)
259 #define CXL_DPA_VOLATILE BIT(0)
260 #define CXL_DPA_NOT_REPAIRABLE BIT(1)
261 #define show_dpa_flags(flags) __print_flags(flags, "|", \
262 { CXL_DPA_VOLATILE, "VOLATILE" }, \
263 { CXL_DPA_NOT_REPAIRABLE, "NOT_REPAIRABLE" } \
267 * General Media Event Record - GMER
268 * CXL rev 3.0 Section 8.2.9.2.1.1; Table 8-43
/*
 * Event descriptor bits; show_event_desc_flags() renders them as a
 * "|"-separated list.
 */
#define CXL_GMER_EVT_DESC_UNCORRECTABLE_EVENT		BIT(0)
/*
 * Historical misspelling ("UNCORECTABLE"). Kept as an alias so existing
 * users of the old name continue to build unchanged.
 */
#define CXL_GMER_EVT_DESC_UNCORECTABLE_EVENT		CXL_GMER_EVT_DESC_UNCORRECTABLE_EVENT
#define CXL_GMER_EVT_DESC_THRESHOLD_EVENT		BIT(1)
#define CXL_GMER_EVT_DESC_POISON_LIST_OVERFLOW		BIT(2)
273 #define show_event_desc_flags(flags) __print_flags(flags, "|", \
274 { CXL_GMER_EVT_DESC_UNCORECTABLE_EVENT, "UNCORRECTABLE_EVENT" }, \
275 { CXL_GMER_EVT_DESC_THRESHOLD_EVENT, "THRESHOLD_EVENT" }, \
276 { CXL_GMER_EVT_DESC_POISON_LIST_OVERFLOW, "POISON_LIST_OVERFLOW" } \
279 #define CXL_GMER_MEM_EVT_TYPE_ECC_ERROR 0x00
280 #define CXL_GMER_MEM_EVT_TYPE_INV_ADDR 0x01
281 #define CXL_GMER_MEM_EVT_TYPE_DATA_PATH_ERROR 0x02
282 #define show_gmer_mem_event_type(type) __print_symbolic(type, \
283 { CXL_GMER_MEM_EVT_TYPE_ECC_ERROR, "ECC Error" }, \
284 { CXL_GMER_MEM_EVT_TYPE_INV_ADDR, "Invalid Address" }, \
285 { CXL_GMER_MEM_EVT_TYPE_DATA_PATH_ERROR, "Data Path Error" } \
288 #define CXL_GMER_TRANS_UNKNOWN 0x00
289 #define CXL_GMER_TRANS_HOST_READ 0x01
290 #define CXL_GMER_TRANS_HOST_WRITE 0x02
291 #define CXL_GMER_TRANS_HOST_SCAN_MEDIA 0x03
292 #define CXL_GMER_TRANS_HOST_INJECT_POISON 0x04
293 #define CXL_GMER_TRANS_INTERNAL_MEDIA_SCRUB 0x05
294 #define CXL_GMER_TRANS_INTERNAL_MEDIA_MANAGEMENT 0x06
295 #define show_trans_type(type) __print_symbolic(type, \
296 { CXL_GMER_TRANS_UNKNOWN, "Unknown" }, \
297 { CXL_GMER_TRANS_HOST_READ, "Host Read" }, \
298 { CXL_GMER_TRANS_HOST_WRITE, "Host Write" }, \
299 { CXL_GMER_TRANS_HOST_SCAN_MEDIA, "Host Scan Media" }, \
300 { CXL_GMER_TRANS_HOST_INJECT_POISON, "Host Inject Poison" }, \
301 { CXL_GMER_TRANS_INTERNAL_MEDIA_SCRUB, "Internal Media Scrub" }, \
302 { CXL_GMER_TRANS_INTERNAL_MEDIA_MANAGEMENT, "Internal Media Management" } \
305 #define CXL_GMER_VALID_CHANNEL BIT(0)
306 #define CXL_GMER_VALID_RANK BIT(1)
307 #define CXL_GMER_VALID_DEVICE BIT(2)
308 #define CXL_GMER_VALID_COMPONENT BIT(3)
309 #define show_valid_flags(flags) __print_flags(flags, "|", \
310 { CXL_GMER_VALID_CHANNEL, "CHANNEL" }, \
311 { CXL_GMER_VALID_RANK, "RANK" }, \
312 { CXL_GMER_VALID_DEVICE, "DEVICE" }, \
313 { CXL_GMER_VALID_COMPONENT, "COMPONENT" } \
316 TRACE_EVENT(cxl_general_media
,
318 TP_PROTO(const struct cxl_memdev
*cxlmd
, enum cxl_event_log_type log
,
319 struct cxl_region
*cxlr
, u64 hpa
, struct cxl_event_gen_media
*rec
),
321 TP_ARGS(cxlmd
, log
, cxlr
, hpa
, rec
),
327 __field(u8
, descriptor
)
329 __field(u8
, transaction_type
)
332 __array(u8
, comp_id
, CXL_EVENT_GEN_MED_COMP_ID_SIZE
)
333 /* Following are out of order to pack trace record */
335 __field_struct(uuid_t
, region_uuid
)
336 __field(u16
, validity_flags
)
338 __field(u8
, dpa_flags
)
339 __string(region_name
, cxlr
? dev_name(&cxlr
->dev
) : "")
343 CXL_EVT_TP_fast_assign(cxlmd
, log
, rec
->media_hdr
.hdr
);
344 __entry
->hdr_uuid
= CXL_EVENT_GEN_MEDIA_UUID
;
347 __entry
->dpa
= le64_to_cpu(rec
->media_hdr
.phys_addr
);
348 __entry
->dpa_flags
= __entry
->dpa
& CXL_DPA_FLAGS_MASK
;
349 /* Mask after flags have been parsed */
350 __entry
->dpa
&= CXL_DPA_MASK
;
351 __entry
->descriptor
= rec
->media_hdr
.descriptor
;
352 __entry
->type
= rec
->media_hdr
.type
;
353 __entry
->transaction_type
= rec
->media_hdr
.transaction_type
;
354 __entry
->channel
= rec
->media_hdr
.channel
;
355 __entry
->rank
= rec
->media_hdr
.rank
;
356 __entry
->device
= get_unaligned_le24(rec
->device
);
357 memcpy(__entry
->comp_id
, &rec
->component_id
,
358 CXL_EVENT_GEN_MED_COMP_ID_SIZE
);
359 __entry
->validity_flags
= get_unaligned_le16(&rec
->media_hdr
.validity_flags
);
362 __assign_str(region_name
);
363 uuid_copy(&__entry
->region_uuid
, &cxlr
->params
.uuid
);
365 __assign_str(region_name
);
366 uuid_copy(&__entry
->region_uuid
, &uuid_null
);
370 CXL_EVT_TP_printk("dpa=%llx dpa_flags='%s' " \
371 "descriptor='%s' type='%s' transaction_type='%s' channel=%u rank=%u " \
372 "device=%x comp_id=%s validity_flags='%s' " \
373 "hpa=%llx region=%s region_uuid=%pUb",
374 __entry
->dpa
, show_dpa_flags(__entry
->dpa_flags
),
375 show_event_desc_flags(__entry
->descriptor
),
376 show_gmer_mem_event_type(__entry
->type
),
377 show_trans_type(__entry
->transaction_type
),
378 __entry
->channel
, __entry
->rank
, __entry
->device
,
379 __print_hex(__entry
->comp_id
, CXL_EVENT_GEN_MED_COMP_ID_SIZE
),
380 show_valid_flags(__entry
->validity_flags
),
381 __entry
->hpa
, __get_str(region_name
), &__entry
->region_uuid
386 * DRAM Event Record - DER
388 * CXL rev 3.0 section 8.2.9.2.1.2; Table 8-44
391 * DRAM Event Record defines many fields the same as the General Media Event
392 * Record. Reuse those definitions as appropriate.
394 #define CXL_DER_MEM_EVT_TYPE_ECC_ERROR 0x00
395 #define CXL_DER_MEM_EVT_TYPE_SCRUB_MEDIA_ECC_ERROR 0x01
396 #define CXL_DER_MEM_EVT_TYPE_INV_ADDR 0x02
397 #define CXL_DER_MEM_EVT_TYPE_DATA_PATH_ERROR 0x03
398 #define show_dram_mem_event_type(type) __print_symbolic(type, \
399 { CXL_DER_MEM_EVT_TYPE_ECC_ERROR, "ECC Error" }, \
400 { CXL_DER_MEM_EVT_TYPE_SCRUB_MEDIA_ECC_ERROR, "Scrub Media ECC Error" }, \
401 { CXL_DER_MEM_EVT_TYPE_INV_ADDR, "Invalid Address" }, \
402 { CXL_DER_MEM_EVT_TYPE_DATA_PATH_ERROR, "Data Path Error" } \
405 #define CXL_DER_VALID_CHANNEL BIT(0)
406 #define CXL_DER_VALID_RANK BIT(1)
407 #define CXL_DER_VALID_NIBBLE BIT(2)
408 #define CXL_DER_VALID_BANK_GROUP BIT(3)
409 #define CXL_DER_VALID_BANK BIT(4)
410 #define CXL_DER_VALID_ROW BIT(5)
411 #define CXL_DER_VALID_COLUMN BIT(6)
412 #define CXL_DER_VALID_CORRECTION_MASK BIT(7)
413 #define show_dram_valid_flags(flags) __print_flags(flags, "|", \
414 { CXL_DER_VALID_CHANNEL, "CHANNEL" }, \
415 { CXL_DER_VALID_RANK, "RANK" }, \
416 { CXL_DER_VALID_NIBBLE, "NIBBLE" }, \
417 { CXL_DER_VALID_BANK_GROUP, "BANK GROUP" }, \
418 { CXL_DER_VALID_BANK, "BANK" }, \
419 { CXL_DER_VALID_ROW, "ROW" }, \
420 { CXL_DER_VALID_COLUMN, "COLUMN" }, \
421 { CXL_DER_VALID_CORRECTION_MASK, "CORRECTION MASK" } \
424 TRACE_EVENT(cxl_dram
,
426 TP_PROTO(const struct cxl_memdev
*cxlmd
, enum cxl_event_log_type log
,
427 struct cxl_region
*cxlr
, u64 hpa
, struct cxl_event_dram
*rec
),
429 TP_ARGS(cxlmd
, log
, cxlr
, hpa
, rec
),
435 __field(u8
, descriptor
)
437 __field(u8
, transaction_type
)
439 __field(u16
, validity_flags
)
440 __field(u16
, column
) /* Out of order to pack trace record */
441 __field(u32
, nibble_mask
)
443 __array(u8
, cor_mask
, CXL_EVENT_DER_CORRECTION_MASK_SIZE
)
445 __field_struct(uuid_t
, region_uuid
)
446 __field(u8
, rank
) /* Out of order to pack trace record */
447 __field(u8
, bank_group
) /* Out of order to pack trace record */
448 __field(u8
, bank
) /* Out of order to pack trace record */
449 __field(u8
, dpa_flags
) /* Out of order to pack trace record */
450 __string(region_name
, cxlr
? dev_name(&cxlr
->dev
) : "")
454 CXL_EVT_TP_fast_assign(cxlmd
, log
, rec
->media_hdr
.hdr
);
455 __entry
->hdr_uuid
= CXL_EVENT_DRAM_UUID
;
458 __entry
->dpa
= le64_to_cpu(rec
->media_hdr
.phys_addr
);
459 __entry
->dpa_flags
= __entry
->dpa
& CXL_DPA_FLAGS_MASK
;
460 __entry
->dpa
&= CXL_DPA_MASK
;
461 __entry
->descriptor
= rec
->media_hdr
.descriptor
;
462 __entry
->type
= rec
->media_hdr
.type
;
463 __entry
->transaction_type
= rec
->media_hdr
.transaction_type
;
464 __entry
->validity_flags
= get_unaligned_le16(rec
->media_hdr
.validity_flags
);
465 __entry
->channel
= rec
->media_hdr
.channel
;
466 __entry
->rank
= rec
->media_hdr
.rank
;
467 __entry
->nibble_mask
= get_unaligned_le24(rec
->nibble_mask
);
468 __entry
->bank_group
= rec
->bank_group
;
469 __entry
->bank
= rec
->bank
;
470 __entry
->row
= get_unaligned_le24(rec
->row
);
471 __entry
->column
= get_unaligned_le16(rec
->column
);
472 memcpy(__entry
->cor_mask
, &rec
->correction_mask
,
473 CXL_EVENT_DER_CORRECTION_MASK_SIZE
);
476 __assign_str(region_name
);
477 uuid_copy(&__entry
->region_uuid
, &cxlr
->params
.uuid
);
479 __assign_str(region_name
);
480 uuid_copy(&__entry
->region_uuid
, &uuid_null
);
484 CXL_EVT_TP_printk("dpa=%llx dpa_flags='%s' descriptor='%s' type='%s' " \
485 "transaction_type='%s' channel=%u rank=%u nibble_mask=%x " \
486 "bank_group=%u bank=%u row=%u column=%u cor_mask=%s " \
487 "validity_flags='%s' " \
488 "hpa=%llx region=%s region_uuid=%pUb",
489 __entry
->dpa
, show_dpa_flags(__entry
->dpa_flags
),
490 show_event_desc_flags(__entry
->descriptor
),
491 show_dram_mem_event_type(__entry
->type
),
492 show_trans_type(__entry
->transaction_type
),
493 __entry
->channel
, __entry
->rank
, __entry
->nibble_mask
,
494 __entry
->bank_group
, __entry
->bank
,
495 __entry
->row
, __entry
->column
,
496 __print_hex(__entry
->cor_mask
, CXL_EVENT_DER_CORRECTION_MASK_SIZE
),
497 show_dram_valid_flags(__entry
->validity_flags
),
498 __entry
->hpa
, __get_str(region_name
), &__entry
->region_uuid
503 * Memory Module Event Record - MMER
505 * CXL rev 3.0 section 8.2.9.2.1.3; Table 8-45
507 #define CXL_MMER_HEALTH_STATUS_CHANGE 0x00
508 #define CXL_MMER_MEDIA_STATUS_CHANGE 0x01
509 #define CXL_MMER_LIFE_USED_CHANGE 0x02
510 #define CXL_MMER_TEMP_CHANGE 0x03
511 #define CXL_MMER_DATA_PATH_ERROR 0x04
512 #define CXL_MMER_LSA_ERROR 0x05
513 #define show_dev_evt_type(type) __print_symbolic(type, \
514 { CXL_MMER_HEALTH_STATUS_CHANGE, "Health Status Change" }, \
515 { CXL_MMER_MEDIA_STATUS_CHANGE, "Media Status Change" }, \
516 { CXL_MMER_LIFE_USED_CHANGE, "Life Used Change" }, \
517 { CXL_MMER_TEMP_CHANGE, "Temperature Change" }, \
518 { CXL_MMER_DATA_PATH_ERROR, "Data Path Error" }, \
519 { CXL_MMER_LSA_ERROR, "LSA Error" } \
523 * Device Health Information - DHI
525 * CXL rev 3.0 section 8.2.9.8.3.1; Table 8-100
527 #define CXL_DHI_HS_MAINTENANCE_NEEDED BIT(0)
528 #define CXL_DHI_HS_PERFORMANCE_DEGRADED BIT(1)
529 #define CXL_DHI_HS_HW_REPLACEMENT_NEEDED BIT(2)
530 #define show_health_status_flags(flags) __print_flags(flags, "|", \
531 { CXL_DHI_HS_MAINTENANCE_NEEDED, "MAINTENANCE_NEEDED" }, \
532 { CXL_DHI_HS_PERFORMANCE_DEGRADED, "PERFORMANCE_DEGRADED" }, \
533 { CXL_DHI_HS_HW_REPLACEMENT_NEEDED, "REPLACEMENT_NEEDED" } \
536 #define CXL_DHI_MS_NORMAL 0x00
537 #define CXL_DHI_MS_NOT_READY 0x01
538 #define CXL_DHI_MS_WRITE_PERSISTENCY_LOST 0x02
539 #define CXL_DHI_MS_ALL_DATA_LOST 0x03
540 #define CXL_DHI_MS_WRITE_PERSISTENCY_LOSS_EVENT_POWER_LOSS 0x04
541 #define CXL_DHI_MS_WRITE_PERSISTENCY_LOSS_EVENT_SHUTDOWN 0x05
542 #define CXL_DHI_MS_WRITE_PERSISTENCY_LOSS_IMMINENT 0x06
543 #define CXL_DHI_MS_WRITE_ALL_DATA_LOSS_EVENT_POWER_LOSS 0x07
544 #define CXL_DHI_MS_WRITE_ALL_DATA_LOSS_EVENT_SHUTDOWN 0x08
545 #define CXL_DHI_MS_WRITE_ALL_DATA_LOSS_IMMINENT 0x09
546 #define show_media_status(ms) __print_symbolic(ms, \
547 { CXL_DHI_MS_NORMAL, \
549 { CXL_DHI_MS_NOT_READY, \
551 { CXL_DHI_MS_WRITE_PERSISTENCY_LOST, \
552 "Write Persistency Lost" }, \
553 { CXL_DHI_MS_ALL_DATA_LOST, \
555 { CXL_DHI_MS_WRITE_PERSISTENCY_LOSS_EVENT_POWER_LOSS, \
556 "Write Persistency Loss in the Event of Power Loss" }, \
557 { CXL_DHI_MS_WRITE_PERSISTENCY_LOSS_EVENT_SHUTDOWN, \
558 "Write Persistency Loss in Event of Shutdown" }, \
559 { CXL_DHI_MS_WRITE_PERSISTENCY_LOSS_IMMINENT, \
560 "Write Persistency Loss Imminent" }, \
561 { CXL_DHI_MS_WRITE_ALL_DATA_LOSS_EVENT_POWER_LOSS, \
562 "All Data Loss in Event of Power Loss" }, \
563 { CXL_DHI_MS_WRITE_ALL_DATA_LOSS_EVENT_SHUTDOWN, \
564 "All Data loss in the Event of Shutdown" }, \
565 { CXL_DHI_MS_WRITE_ALL_DATA_LOSS_IMMINENT, \
566 "All Data Loss Imminent" } \
569 #define CXL_DHI_AS_NORMAL 0x0
570 #define CXL_DHI_AS_WARNING 0x1
571 #define CXL_DHI_AS_CRITICAL 0x2
572 #define show_two_bit_status(as) __print_symbolic(as, \
573 { CXL_DHI_AS_NORMAL, "Normal" }, \
574 { CXL_DHI_AS_WARNING, "Warning" }, \
575 { CXL_DHI_AS_CRITICAL, "Critical" } \
577 #define show_one_bit_status(as) __print_symbolic(as, \
578 { CXL_DHI_AS_NORMAL, "Normal" }, \
579 { CXL_DHI_AS_WARNING, "Warning" } \
/*
 * Field extractors for the packed add_status byte. Each yields the field
 * shifted down to bit 0, ready for show_two_bit_status() (two-bit fields)
 * or show_one_bit_status() (one-bit fields):
 *
 *   bits 1:0  -> printed as as_life_used
 *   bits 3:2  -> printed as as_dev_temp
 *   bit  4    -> printed as as_cor_vol_err_cnt
 *   bit  5    -> printed as as_cor_per_err_cnt
 *
 * The argument is parenthesized so that expressions using operators of
 * lower precedence than '&' (e.g. "a | b") are masked as a whole.
 */
#define CXL_DHI_AS_LIFE_USED(as)		((as) & 0x3)
#define CXL_DHI_AS_DEV_TEMP(as)			(((as) & 0xC) >> 2)
#define CXL_DHI_AS_COR_VOL_ERR_CNT(as)		(((as) & 0x10) >> 4)
#define CXL_DHI_AS_COR_PER_ERR_CNT(as)		(((as) & 0x20) >> 5)
587 TRACE_EVENT(cxl_memory_module
,
589 TP_PROTO(const struct cxl_memdev
*cxlmd
, enum cxl_event_log_type log
,
590 struct cxl_event_mem_module
*rec
),
592 TP_ARGS(cxlmd
, log
, rec
),
597 /* Memory Module Event */
598 __field(u8
, event_type
)
600 /* Device Health Info */
601 __field(u8
, health_status
)
602 __field(u8
, media_status
)
603 __field(u8
, life_used
)
604 __field(u32
, dirty_shutdown_cnt
)
605 __field(u32
, cor_vol_err_cnt
)
606 __field(u32
, cor_per_err_cnt
)
607 __field(s16
, device_temp
)
608 __field(u8
, add_status
)
612 CXL_EVT_TP_fast_assign(cxlmd
, log
, rec
->hdr
);
613 __entry
->hdr_uuid
= CXL_EVENT_MEM_MODULE_UUID
;
615 /* Memory Module Event */
616 __entry
->event_type
= rec
->event_type
;
618 /* Device Health Info */
619 __entry
->health_status
= rec
->info
.health_status
;
620 __entry
->media_status
= rec
->info
.media_status
;
621 __entry
->life_used
= rec
->info
.life_used
;
622 __entry
->dirty_shutdown_cnt
= get_unaligned_le32(rec
->info
.dirty_shutdown_cnt
);
623 __entry
->cor_vol_err_cnt
= get_unaligned_le32(rec
->info
.cor_vol_err_cnt
);
624 __entry
->cor_per_err_cnt
= get_unaligned_le32(rec
->info
.cor_per_err_cnt
);
625 __entry
->device_temp
= get_unaligned_le16(rec
->info
.device_temp
);
626 __entry
->add_status
= rec
->info
.add_status
;
629 CXL_EVT_TP_printk("event_type='%s' health_status='%s' media_status='%s' " \
630 "as_life_used=%s as_dev_temp=%s as_cor_vol_err_cnt=%s " \
631 "as_cor_per_err_cnt=%s life_used=%u device_temp=%d " \
632 "dirty_shutdown_cnt=%u cor_vol_err_cnt=%u cor_per_err_cnt=%u",
633 show_dev_evt_type(__entry
->event_type
),
634 show_health_status_flags(__entry
->health_status
),
635 show_media_status(__entry
->media_status
),
636 show_two_bit_status(CXL_DHI_AS_LIFE_USED(__entry
->add_status
)),
637 show_two_bit_status(CXL_DHI_AS_DEV_TEMP(__entry
->add_status
)),
638 show_one_bit_status(CXL_DHI_AS_COR_VOL_ERR_CNT(__entry
->add_status
)),
639 show_one_bit_status(CXL_DHI_AS_COR_PER_ERR_CNT(__entry
->add_status
)),
640 __entry
->life_used
, __entry
->device_temp
,
641 __entry
->dirty_shutdown_cnt
, __entry
->cor_vol_err_cnt
,
642 __entry
->cor_per_err_cnt
/* Label for the kind of poison trace (printed after "trace_type="). */
#define show_poison_trace_type(trace_kind) __print_symbolic(trace_kind,	\
	{ CXL_POISON_TRACE_LIST,	"List" },			\
	{ CXL_POISON_TRACE_INJECT,	"Inject" },			\
	{ CXL_POISON_TRACE_CLEAR,	"Clear" }			\
)
/*
 * Label lookup for the poison source values that have a name. Callers
 * normally go through show_poison_source(), which handles the values
 * not listed here.
 */
#define __show_poison_source(src) __print_symbolic(src,			\
	{ CXL_POISON_SOURCE_UNKNOWN,	"Unknown" },			\
	{ CXL_POISON_SOURCE_EXTERNAL,	"External" },			\
	{ CXL_POISON_SOURCE_INTERNAL,	"Internal" },			\
	{ CXL_POISON_SOURCE_INJECTED,	"Injected" },			\
	{ CXL_POISON_SOURCE_VENDOR,	"Vendor" }			\
)
/*
 * Label for a poison source value. Values above
 * CXL_POISON_SOURCE_INJECTED that are not CXL_POISON_SOURCE_VENDOR are
 * reported as "Reserved"; everything else is looked up with
 * __show_poison_source().
 *
 * The argument is parenthesized in both comparisons so that a compound
 * expression (e.g. "a | b") is compared as a whole.
 */
#define show_poison_source(source)					\
	((((source) > CXL_POISON_SOURCE_INJECTED) &&			\
	  ((source) != CXL_POISON_SOURCE_VENDOR)) ? "Reserved"		\
	 : __show_poison_source(source))
/* Render the poison flag bits as a "|"-separated list of names. */
#define show_poison_flags(poison_flags) __print_flags(poison_flags, "|",	\
	{ CXL_POISON_FLAG_MORE,		"More" },				\
	{ CXL_POISON_FLAG_OVERFLOW,	"Overflow" },				\
	{ CXL_POISON_FLAG_SCANNING,	"Scanning" }				\
)
/*
 * Accessors for a poison record (pointer argument) as used by the
 * cxl_poison trace event:
 *
 *   __cxl_poison_addr()            - CPU-endian value of record->address
 *   cxl_poison_record_dpa()        - address bits under CXL_POISON_START_MASK
 *   cxl_poison_record_source()     - address bits under CXL_POISON_SOURCE_MASK
 *   cxl_poison_record_dpa_length() - record->length times CXL_POISON_LEN_MULT
 *   cxl_poison_overflow()          - CPU-endian @time when
 *                                    CXL_POISON_FLAG_OVERFLOW is set in
 *                                    @flags, otherwise 0
 *
 * Arguments are parenthesized so callers may pass expressions such as
 * "&rec" or "a | b" without precedence surprises.
 */
#define __cxl_poison_addr(record)					\
	(le64_to_cpu((record)->address))
#define cxl_poison_record_dpa(record)					\
	(__cxl_poison_addr(record) & CXL_POISON_START_MASK)
#define cxl_poison_record_source(record)				\
	(__cxl_poison_addr(record) & CXL_POISON_SOURCE_MASK)
#define cxl_poison_record_dpa_length(record)				\
	(le32_to_cpu((record)->length) * CXL_POISON_LEN_MULT)
#define cxl_poison_overflow(flags, time)				\
	(((flags) & CXL_POISON_FLAG_OVERFLOW) ? le64_to_cpu(time) : 0)
682 TRACE_EVENT(cxl_poison
,
684 TP_PROTO(struct cxl_memdev
*cxlmd
, struct cxl_region
*cxlr
,
685 const struct cxl_poison_record
*record
, u8 flags
,
686 __le64 overflow_ts
, enum cxl_poison_trace_type trace_type
),
688 TP_ARGS(cxlmd
, cxlr
, record
, flags
, overflow_ts
, trace_type
),
691 __string(memdev
, dev_name(&cxlmd
->dev
))
692 __string(host
, dev_name(cxlmd
->dev
.parent
))
694 __field(u8
, trace_type
)
695 __string(region
, cxlr
? dev_name(&cxlr
->dev
) : "")
696 __field(u64
, overflow_ts
)
699 __field(u32
, dpa_length
)
700 __array(char, uuid
, 16)
706 __assign_str(memdev
);
708 __entry
->serial
= cxlmd
->cxlds
->serial
;
709 __entry
->overflow_ts
= cxl_poison_overflow(flags
, overflow_ts
);
710 __entry
->dpa
= cxl_poison_record_dpa(record
);
711 __entry
->dpa_length
= cxl_poison_record_dpa_length(record
);
712 __entry
->source
= cxl_poison_record_source(record
);
713 __entry
->trace_type
= trace_type
;
714 __entry
->flags
= flags
;
716 __assign_str(region
);
717 memcpy(__entry
->uuid
, &cxlr
->params
.uuid
, 16);
718 __entry
->hpa
= cxl_dpa_to_hpa(cxlr
, cxlmd
,
721 __assign_str(region
);
722 memset(__entry
->uuid
, 0, 16);
723 __entry
->hpa
= ULLONG_MAX
;
727 TP_printk("memdev=%s host=%s serial=%lld trace_type=%s region=%s " \
728 "region_uuid=%pU hpa=0x%llx dpa=0x%llx dpa_length=0x%x " \
729 "source=%s flags=%s overflow_time=%llu",
733 show_poison_trace_type(__entry
->trace_type
),
739 show_poison_source(__entry
->source
),
740 show_poison_flags(__entry
->flags
),
745 #endif /* _CXL_EVENTS_H */
747 #define TRACE_INCLUDE_FILE trace
748 #include <trace/define_trace.h>