4 * Copyright (c) 2010 Isaku Yamahata <yamahata at valinux co jp>
5 * VA Linux Systems Japan K.K.
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License along
18 * with this program; if not, see <http://www.gnu.org/licenses/>.
21 #include "qemu/osdep.h"
22 #include "hw/pci/msi.h"
23 #include "hw/xen/xen.h"
24 #include "qemu/range.h"
25 #include "qapi/error.h"
26 #include "sysemu/xen.h"
28 #include "hw/i386/kvm/xen_evtchn.h"
30 /* PCI_MSI_ADDRESS_LO */
31 #define PCI_MSI_ADDRESS_LO_MASK (~0x3)
33 /* If we get rid of cap allocator, we won't need those. */
34 #define PCI_MSI_32_SIZEOF 0x0a
35 #define PCI_MSI_64_SIZEOF 0x0e
36 #define PCI_MSI_32M_SIZEOF 0x14
37 #define PCI_MSI_64M_SIZEOF 0x18
39 #define PCI_MSI_VECTORS_MAX 32
42 * Flag for interrupt controllers to declare broken MSI/MSI-X support.
43 * values: false - broken; true - non-broken.
45 * Setting this flag to false will remove MSI/MSI-X capability from all devices.
47 * It is preferable for controllers to set this to true (non-broken) even if
48 * they do not actually support MSI/MSI-X: guests normally probe the controller
49 * type and do not attempt to enable MSI/MSI-X with interrupt controllers not
50 * supporting such, so removing the capability is not required, and
51 * it seems cleaner to have a given device look the same for all boards.
53 * TODO: some existing controllers violate the above rule. Identify and fix them.
57 /* If we get rid of cap allocator, we won't need this. */
58 static inline uint8_t msi_cap_sizeof(uint16_t flags
)
60 switch (flags
& (PCI_MSI_FLAGS_MASKBIT
| PCI_MSI_FLAGS_64BIT
)) {
61 case PCI_MSI_FLAGS_MASKBIT
| PCI_MSI_FLAGS_64BIT
:
62 return PCI_MSI_64M_SIZEOF
;
63 case PCI_MSI_FLAGS_64BIT
:
64 return PCI_MSI_64_SIZEOF
;
65 case PCI_MSI_FLAGS_MASKBIT
:
66 return PCI_MSI_32M_SIZEOF
;
68 return PCI_MSI_32_SIZEOF
;
79 # define MSI_DPRINTF(fmt, ...) \
80 fprintf(stderr, "%s:%d " fmt, __func__, __LINE__, ## __VA_ARGS__)
82 # define MSI_DPRINTF(fmt, ...) do { } while (0)
84 #define MSI_DEV_PRINTF(dev, fmt, ...) \
85 MSI_DPRINTF("%s:%x " fmt, (dev)->name, (dev)->devfn, ## __VA_ARGS__)
87 static inline unsigned int msi_nr_vectors(uint16_t flags
)
90 ((flags
& PCI_MSI_FLAGS_QSIZE
) >> ctz32(PCI_MSI_FLAGS_QSIZE
));
93 static inline uint8_t msi_flags_off(const PCIDevice
* dev
)
95 return dev
->msi_cap
+ PCI_MSI_FLAGS
;
98 static inline uint8_t msi_address_lo_off(const PCIDevice
* dev
)
100 return dev
->msi_cap
+ PCI_MSI_ADDRESS_LO
;
103 static inline uint8_t msi_address_hi_off(const PCIDevice
* dev
)
105 return dev
->msi_cap
+ PCI_MSI_ADDRESS_HI
;
108 static inline uint8_t msi_data_off(const PCIDevice
* dev
, bool msi64bit
)
110 return dev
->msi_cap
+ (msi64bit
? PCI_MSI_DATA_64
: PCI_MSI_DATA_32
);
113 static inline uint8_t msi_mask_off(const PCIDevice
* dev
, bool msi64bit
)
115 return dev
->msi_cap
+ (msi64bit
? PCI_MSI_MASK_64
: PCI_MSI_MASK_32
);
118 static inline uint8_t msi_pending_off(const PCIDevice
* dev
, bool msi64bit
)
120 return dev
->msi_cap
+ (msi64bit
? PCI_MSI_PENDING_64
: PCI_MSI_PENDING_32
);
124 * Special API for POWER to configure the vectors through
125 * a side channel. Should never be used by devices.
127 void msi_set_message(PCIDevice
*dev
, MSIMessage msg
)
129 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
130 bool msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
133 pci_set_quad(dev
->config
+ msi_address_lo_off(dev
), msg
.address
);
135 pci_set_long(dev
->config
+ msi_address_lo_off(dev
), msg
.address
);
137 pci_set_word(dev
->config
+ msi_data_off(dev
, msi64bit
), msg
.data
);
140 static MSIMessage
msi_prepare_message(PCIDevice
*dev
, unsigned int vector
)
142 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
143 bool msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
144 unsigned int nr_vectors
= msi_nr_vectors(flags
);
147 assert(vector
< nr_vectors
);
150 msg
.address
= pci_get_quad(dev
->config
+ msi_address_lo_off(dev
));
152 msg
.address
= pci_get_long(dev
->config
+ msi_address_lo_off(dev
));
155 /* upper bit 31:16 is zero */
156 msg
.data
= pci_get_word(dev
->config
+ msi_data_off(dev
, msi64bit
));
157 if (nr_vectors
> 1) {
158 msg
.data
&= ~(nr_vectors
- 1);
165 MSIMessage
msi_get_message(PCIDevice
*dev
, unsigned int vector
)
167 return dev
->msi_prepare_message(dev
, vector
);
170 bool msi_enabled(const PCIDevice
*dev
)
172 return msi_present(dev
) &&
173 (pci_get_word(dev
->config
+ msi_flags_off(dev
)) &
174 PCI_MSI_FLAGS_ENABLE
);
178 * Make PCI device @dev MSI-capable.
179 * Non-zero @offset puts capability MSI at that offset in PCI config
181 * @nr_vectors is the number of MSI vectors (1, 2, 4, 8, 16 or 32).
182 * If @msi64bit, make the device capable of sending a 64-bit message
184 * If @msi_per_vector_mask, make the device support per-vector masking.
185 * @errp is for returning errors.
186 * Return 0 on success; set @errp and return -errno on error.
188 * -ENOTSUP means lacking msi support for a msi-capable platform.
189 * -EINVAL means capability overlap, happens when @offset is non-zero,
190 * also means a programming error, except device assignment, which can check
191 * if a real HW is broken.
193 int msi_init(struct PCIDevice
*dev
, uint8_t offset
,
194 unsigned int nr_vectors
, bool msi64bit
,
195 bool msi_per_vector_mask
, Error
**errp
)
197 unsigned int vectors_order
;
202 if (!msi_nonbroken
) {
203 error_setg(errp
, "MSI is not supported by interrupt controller");
208 "init offset: 0x%"PRIx8
" vector: %"PRId8
209 " 64bit %d mask %d\n",
210 offset
, nr_vectors
, msi64bit
, msi_per_vector_mask
);
212 assert(!(nr_vectors
& (nr_vectors
- 1))); /* power of 2 */
213 assert(nr_vectors
> 0);
214 assert(nr_vectors
<= PCI_MSI_VECTORS_MAX
);
215 /* the nr of MSI vectors is up to 32 */
216 vectors_order
= ctz32(nr_vectors
);
218 flags
= vectors_order
<< ctz32(PCI_MSI_FLAGS_QMASK
);
220 flags
|= PCI_MSI_FLAGS_64BIT
;
222 if (msi_per_vector_mask
) {
223 flags
|= PCI_MSI_FLAGS_MASKBIT
;
226 cap_size
= msi_cap_sizeof(flags
);
227 config_offset
= pci_add_capability(dev
, PCI_CAP_ID_MSI
, offset
,
229 if (config_offset
< 0) {
230 return config_offset
;
233 dev
->msi_cap
= config_offset
;
234 dev
->cap_present
|= QEMU_PCI_CAP_MSI
;
236 pci_set_word(dev
->config
+ msi_flags_off(dev
), flags
);
237 pci_set_word(dev
->wmask
+ msi_flags_off(dev
),
238 PCI_MSI_FLAGS_QSIZE
| PCI_MSI_FLAGS_ENABLE
);
239 pci_set_long(dev
->wmask
+ msi_address_lo_off(dev
),
240 PCI_MSI_ADDRESS_LO_MASK
);
242 pci_set_long(dev
->wmask
+ msi_address_hi_off(dev
), 0xffffffff);
244 pci_set_word(dev
->wmask
+ msi_data_off(dev
, msi64bit
), 0xffff);
246 if (msi_per_vector_mask
) {
247 /* Make mask bits 0 to nr_vectors - 1 writable. */
248 pci_set_long(dev
->wmask
+ msi_mask_off(dev
, msi64bit
),
249 0xffffffff >> (PCI_MSI_VECTORS_MAX
- nr_vectors
));
252 dev
->msi_prepare_message
= msi_prepare_message
;
257 void msi_uninit(struct PCIDevice
*dev
)
262 if (!msi_present(dev
)) {
265 flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
266 cap_size
= msi_cap_sizeof(flags
);
267 pci_del_capability(dev
, PCI_CAP_ID_MSI
, cap_size
);
268 dev
->cap_present
&= ~QEMU_PCI_CAP_MSI
;
269 dev
->msi_prepare_message
= NULL
;
271 MSI_DEV_PRINTF(dev
, "uninit\n");
274 void msi_reset(PCIDevice
*dev
)
279 if (!msi_present(dev
)) {
283 flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
284 flags
&= ~(PCI_MSI_FLAGS_QSIZE
| PCI_MSI_FLAGS_ENABLE
);
285 msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
287 pci_set_word(dev
->config
+ msi_flags_off(dev
), flags
);
288 pci_set_long(dev
->config
+ msi_address_lo_off(dev
), 0);
290 pci_set_long(dev
->config
+ msi_address_hi_off(dev
), 0);
292 pci_set_word(dev
->config
+ msi_data_off(dev
, msi64bit
), 0);
293 if (flags
& PCI_MSI_FLAGS_MASKBIT
) {
294 pci_set_long(dev
->config
+ msi_mask_off(dev
, msi64bit
), 0);
295 pci_set_long(dev
->config
+ msi_pending_off(dev
, msi64bit
), 0);
297 MSI_DEV_PRINTF(dev
, "reset\n");
300 bool msi_is_masked(const PCIDevice
*dev
, unsigned int vector
)
302 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
304 bool msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
305 assert(vector
< PCI_MSI_VECTORS_MAX
);
307 if (!(flags
& PCI_MSI_FLAGS_MASKBIT
)) {
311 data
= pci_get_word(dev
->config
+ msi_data_off(dev
, msi64bit
));
312 if (xen_enabled() && xen_is_pirq_msi(data
)) {
316 mask
= pci_get_long(dev
->config
+
317 msi_mask_off(dev
, flags
& PCI_MSI_FLAGS_64BIT
));
318 return mask
& (1U << vector
);
321 void msi_set_mask(PCIDevice
*dev
, int vector
, bool mask
, Error
**errp
)
323 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
324 bool msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
325 uint32_t irq_state
, vector_mask
, pending
;
327 if (vector
>= PCI_MSI_VECTORS_MAX
) {
328 error_setg(errp
, "msi: vector %d not allocated. max vector is %d",
329 vector
, (PCI_MSI_VECTORS_MAX
- 1));
333 vector_mask
= (1U << vector
);
335 irq_state
= pci_get_long(dev
->config
+ msi_mask_off(dev
, msi64bit
));
338 irq_state
|= vector_mask
;
340 irq_state
&= ~vector_mask
;
343 pci_set_long(dev
->config
+ msi_mask_off(dev
, msi64bit
), irq_state
);
345 pending
= pci_get_long(dev
->config
+ msi_pending_off(dev
, msi64bit
));
346 if (!mask
&& (pending
& vector_mask
)) {
347 pending
&= ~vector_mask
;
348 pci_set_long(dev
->config
+ msi_pending_off(dev
, msi64bit
), pending
);
349 msi_notify(dev
, vector
);
353 void msi_notify(PCIDevice
*dev
, unsigned int vector
)
355 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
356 bool msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
357 unsigned int nr_vectors
= msi_nr_vectors(flags
);
360 assert(vector
< nr_vectors
);
361 if (msi_is_masked(dev
, vector
)) {
362 assert(flags
& PCI_MSI_FLAGS_MASKBIT
);
363 pci_long_test_and_set_mask(
364 dev
->config
+ msi_pending_off(dev
, msi64bit
), 1U << vector
);
365 MSI_DEV_PRINTF(dev
, "pending vector 0x%x\n", vector
);
369 msg
= msi_get_message(dev
, vector
);
373 " address: 0x%"PRIx64
" data: 0x%"PRIx32
"\n",
374 vector
, msg
.address
, msg
.data
);
375 msi_send_message(dev
, msg
);
378 void msi_send_message(PCIDevice
*dev
, MSIMessage msg
)
380 dev
->msi_trigger(dev
, msg
);
383 /* Normally called by pci_default_write_config(). */
384 void msi_write_config(PCIDevice
*dev
, uint32_t addr
, uint32_t val
, int len
)
386 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
387 bool msi64bit
= flags
& PCI_MSI_FLAGS_64BIT
;
388 bool msi_per_vector_mask
= flags
& PCI_MSI_FLAGS_MASKBIT
;
389 unsigned int nr_vectors
;
390 uint8_t log_num_vecs
;
391 uint8_t log_max_vecs
;
395 if (!msi_present(dev
) ||
396 !ranges_overlap(addr
, len
, dev
->msi_cap
, msi_cap_sizeof(flags
))) {
401 MSI_DEV_PRINTF(dev
, "addr 0x%"PRIx32
" val 0x%"PRIx32
" len %d\n",
403 MSI_DEV_PRINTF(dev
, "ctrl: 0x%"PRIx16
" address: 0x%"PRIx32
,
405 pci_get_long(dev
->config
+ msi_address_lo_off(dev
)));
407 fprintf(stderr
, " address-hi: 0x%"PRIx32
,
408 pci_get_long(dev
->config
+ msi_address_hi_off(dev
)));
410 fprintf(stderr
, " data: 0x%"PRIx16
,
411 pci_get_word(dev
->config
+ msi_data_off(dev
, msi64bit
)));
412 if (flags
& PCI_MSI_FLAGS_MASKBIT
) {
413 fprintf(stderr
, " mask 0x%"PRIx32
" pending 0x%"PRIx32
,
414 pci_get_long(dev
->config
+ msi_mask_off(dev
, msi64bit
)),
415 pci_get_long(dev
->config
+ msi_pending_off(dev
, msi64bit
)));
417 fprintf(stderr
, "\n");
420 if (xen_mode
== XEN_EMULATE
) {
421 for (vector
= 0; vector
< msi_nr_vectors(flags
); vector
++) {
422 MSIMessage msg
= msi_prepare_message(dev
, vector
);
424 xen_evtchn_snoop_msi(dev
, false, vector
, msg
.address
, msg
.data
,
425 msi_is_masked(dev
, vector
));
429 if (!(flags
& PCI_MSI_FLAGS_ENABLE
)) {
434 * Now MSI is enabled, clear INTx# interrupts.
435 * the driver is prohibited from writing enable bit to mask
436 * a service request. But the guest OS could do this.
437 * So we just discard the interrupts as moderate fallback.
439 * 6.8.3.3. Enabling Operation
440 * While enabled for MSI or MSI-X operation, a function is prohibited
441 * from using its INTx# pin (if implemented) to request
442 * service (MSI, MSI-X, and INTx# are mutually exclusive).
444 pci_device_deassert_intx(dev
);
447 * nr_vectors might be set bigger than capable. So clamp it.
448 * This is not legal by spec, so we can do anything we like,
449 * just don't crash the host
452 (flags
& PCI_MSI_FLAGS_QSIZE
) >> ctz32(PCI_MSI_FLAGS_QSIZE
);
454 (flags
& PCI_MSI_FLAGS_QMASK
) >> ctz32(PCI_MSI_FLAGS_QMASK
);
455 if (log_num_vecs
> log_max_vecs
) {
456 flags
&= ~PCI_MSI_FLAGS_QSIZE
;
457 flags
|= log_max_vecs
<< ctz32(PCI_MSI_FLAGS_QSIZE
);
458 pci_set_word(dev
->config
+ msi_flags_off(dev
), flags
);
461 if (!msi_per_vector_mask
) {
462 /* if per vector masking isn't supported,
463 there is no pending interrupt. */
467 nr_vectors
= msi_nr_vectors(flags
);
469 /* This will discard pending interrupts, if any. */
470 pending
= pci_get_long(dev
->config
+ msi_pending_off(dev
, msi64bit
));
471 pending
&= 0xffffffff >> (PCI_MSI_VECTORS_MAX
- nr_vectors
);
472 pci_set_long(dev
->config
+ msi_pending_off(dev
, msi64bit
), pending
);
474 /* deliver pending interrupts which are unmasked */
475 for (vector
= 0; vector
< nr_vectors
; ++vector
) {
476 if (msi_is_masked(dev
, vector
) || !(pending
& (1U << vector
))) {
480 pci_long_test_and_clear_mask(
481 dev
->config
+ msi_pending_off(dev
, msi64bit
), 1U << vector
);
482 msi_notify(dev
, vector
);
486 unsigned int msi_nr_vectors_allocated(const PCIDevice
*dev
)
488 uint16_t flags
= pci_get_word(dev
->config
+ msi_flags_off(dev
));
489 return msi_nr_vectors(flags
);