Merge branch 'fixes' of git://git.kernel.org/pub/scm/linux/kernel/git/evalenti/linux...
[linux/fpc-iii.git] / drivers / xen / xen-pciback / xenbus.c
blobc252eb3f01767a4cb3ed906b884306cd3d83b20a
1 /*
2 * PCI Backend Xenbus Setup - handles setup with frontend and xend
4 * Author: Ryan Wilson <hap9@epoch.ncsc.mil>
5 */
7 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
9 #include <linux/moduleparam.h>
10 #include <linux/init.h>
11 #include <linux/list.h>
12 #include <linux/vmalloc.h>
13 #include <linux/workqueue.h>
14 #include <xen/xenbus.h>
15 #include <xen/events.h>
16 #include <asm/xen/pci.h>
17 #include "pciback.h"
19 #define INVALID_EVTCHN_IRQ (-1)
20 struct workqueue_struct *xen_pcibk_wq;
22 static bool __read_mostly passthrough;
23 module_param(passthrough, bool, S_IRUGO);
24 MODULE_PARM_DESC(passthrough,
25 "Option to specify how to export PCI topology to guest:\n"\
26 " 0 - (default) Hide the true PCI topology and makes the frontend\n"\
27 " there is a single PCI bus with only the exported devices on it.\n"\
28 " For example, a device at 03:05.0 will be re-assigned to 00:00.0\n"\
29 " while second device at 02:1a.1 will be re-assigned to 00:01.1.\n"\
30 " 1 - Passthrough provides a real view of the PCI topology to the\n"\
31 " frontend (for example, a device at 06:01.b will still appear at\n"\
32 " 06:01.b to the frontend). This is similar to how Xen 2.0.x\n"\
33 " exposed PCI devices to its driver domains. This may be required\n"\
34 " for drivers which depend on finding their hardward in certain\n"\
35 " bus/slot locations.");
37 static struct xen_pcibk_device *alloc_pdev(struct xenbus_device *xdev)
39 struct xen_pcibk_device *pdev;
41 pdev = kzalloc(sizeof(struct xen_pcibk_device), GFP_KERNEL);
42 if (pdev == NULL)
43 goto out;
44 dev_dbg(&xdev->dev, "allocated pdev @ 0x%p\n", pdev);
46 pdev->xdev = xdev;
48 mutex_init(&pdev->dev_lock);
50 pdev->sh_info = NULL;
51 pdev->evtchn_irq = INVALID_EVTCHN_IRQ;
52 pdev->be_watching = 0;
54 INIT_WORK(&pdev->op_work, xen_pcibk_do_op);
56 if (xen_pcibk_init_devices(pdev)) {
57 kfree(pdev);
58 pdev = NULL;
61 dev_set_drvdata(&xdev->dev, pdev);
63 out:
64 return pdev;
67 static void xen_pcibk_disconnect(struct xen_pcibk_device *pdev)
69 mutex_lock(&pdev->dev_lock);
70 /* Ensure the guest can't trigger our handler before removing devices */
71 if (pdev->evtchn_irq != INVALID_EVTCHN_IRQ) {
72 unbind_from_irqhandler(pdev->evtchn_irq, pdev);
73 pdev->evtchn_irq = INVALID_EVTCHN_IRQ;
76 /* If the driver domain started an op, make sure we complete it
77 * before releasing the shared memory */
79 /* Note, the workqueue does not use spinlocks at all.*/
80 flush_workqueue(xen_pcibk_wq);
82 if (pdev->sh_info != NULL) {
83 xenbus_unmap_ring_vfree(pdev->xdev, pdev->sh_info);
84 pdev->sh_info = NULL;
86 mutex_unlock(&pdev->dev_lock);
89 static void free_pdev(struct xen_pcibk_device *pdev)
91 if (pdev->be_watching) {
92 unregister_xenbus_watch(&pdev->be_watch);
93 pdev->be_watching = 0;
96 xen_pcibk_disconnect(pdev);
98 /* N.B. This calls pcistub_put_pci_dev which does the FLR on all
99 * of the PCIe devices. */
100 xen_pcibk_release_devices(pdev);
102 dev_set_drvdata(&pdev->xdev->dev, NULL);
103 pdev->xdev = NULL;
105 kfree(pdev);
108 static int xen_pcibk_do_attach(struct xen_pcibk_device *pdev, int gnt_ref,
109 int remote_evtchn)
111 int err = 0;
112 void *vaddr;
114 dev_dbg(&pdev->xdev->dev,
115 "Attaching to frontend resources - gnt_ref=%d evtchn=%d\n",
116 gnt_ref, remote_evtchn);
118 err = xenbus_map_ring_valloc(pdev->xdev, &gnt_ref, 1, &vaddr);
119 if (err < 0) {
120 xenbus_dev_fatal(pdev->xdev, err,
121 "Error mapping other domain page in ours.");
122 goto out;
125 pdev->sh_info = vaddr;
127 err = bind_interdomain_evtchn_to_irqhandler(
128 pdev->xdev->otherend_id, remote_evtchn, xen_pcibk_handle_event,
129 0, DRV_NAME, pdev);
130 if (err < 0) {
131 xenbus_dev_fatal(pdev->xdev, err,
132 "Error binding event channel to IRQ");
133 goto out;
135 pdev->evtchn_irq = err;
136 err = 0;
138 dev_dbg(&pdev->xdev->dev, "Attached!\n");
139 out:
140 return err;
143 static int xen_pcibk_attach(struct xen_pcibk_device *pdev)
145 int err = 0;
146 int gnt_ref, remote_evtchn;
147 char *magic = NULL;
150 mutex_lock(&pdev->dev_lock);
151 /* Make sure we only do this setup once */
152 if (xenbus_read_driver_state(pdev->xdev->nodename) !=
153 XenbusStateInitialised)
154 goto out;
156 /* Wait for frontend to state that it has published the configuration */
157 if (xenbus_read_driver_state(pdev->xdev->otherend) !=
158 XenbusStateInitialised)
159 goto out;
161 dev_dbg(&pdev->xdev->dev, "Reading frontend config\n");
163 err = xenbus_gather(XBT_NIL, pdev->xdev->otherend,
164 "pci-op-ref", "%u", &gnt_ref,
165 "event-channel", "%u", &remote_evtchn,
166 "magic", NULL, &magic, NULL);
167 if (err) {
168 /* If configuration didn't get read correctly, wait longer */
169 xenbus_dev_fatal(pdev->xdev, err,
170 "Error reading configuration from frontend");
171 goto out;
174 if (magic == NULL || strcmp(magic, XEN_PCI_MAGIC) != 0) {
175 xenbus_dev_fatal(pdev->xdev, -EFAULT,
176 "version mismatch (%s/%s) with pcifront - "
177 "halting " DRV_NAME,
178 magic, XEN_PCI_MAGIC);
179 err = -EFAULT;
180 goto out;
183 err = xen_pcibk_do_attach(pdev, gnt_ref, remote_evtchn);
184 if (err)
185 goto out;
187 dev_dbg(&pdev->xdev->dev, "Connecting...\n");
189 err = xenbus_switch_state(pdev->xdev, XenbusStateConnected);
190 if (err)
191 xenbus_dev_fatal(pdev->xdev, err,
192 "Error switching to connected state!");
194 dev_dbg(&pdev->xdev->dev, "Connected? %d\n", err);
195 out:
196 mutex_unlock(&pdev->dev_lock);
198 kfree(magic);
200 return err;
203 static int xen_pcibk_publish_pci_dev(struct xen_pcibk_device *pdev,
204 unsigned int domain, unsigned int bus,
205 unsigned int devfn, unsigned int devid)
207 int err;
208 int len;
209 char str[64];
211 len = snprintf(str, sizeof(str), "vdev-%d", devid);
212 if (unlikely(len >= (sizeof(str) - 1))) {
213 err = -ENOMEM;
214 goto out;
217 /* Note: The PV protocol uses %02x, don't change it */
218 err = xenbus_printf(XBT_NIL, pdev->xdev->nodename, str,
219 "%04x:%02x:%02x.%02x", domain, bus,
220 PCI_SLOT(devfn), PCI_FUNC(devfn));
222 out:
223 return err;
226 static int xen_pcibk_export_device(struct xen_pcibk_device *pdev,
227 int domain, int bus, int slot, int func,
228 int devid)
230 struct pci_dev *dev;
231 int err = 0;
233 dev_dbg(&pdev->xdev->dev, "exporting dom %x bus %x slot %x func %x\n",
234 domain, bus, slot, func);
236 dev = pcistub_get_pci_dev_by_slot(pdev, domain, bus, slot, func);
237 if (!dev) {
238 err = -EINVAL;
239 xenbus_dev_fatal(pdev->xdev, err,
240 "Couldn't locate PCI device "
241 "(%04x:%02x:%02x.%d)! "
242 "perhaps already in-use?",
243 domain, bus, slot, func);
244 goto out;
247 err = xen_pcibk_add_pci_dev(pdev, dev, devid,
248 xen_pcibk_publish_pci_dev);
249 if (err)
250 goto out;
252 dev_info(&dev->dev, "registering for %d\n", pdev->xdev->otherend_id);
253 if (xen_register_device_domain_owner(dev,
254 pdev->xdev->otherend_id) != 0) {
255 dev_err(&dev->dev, "Stealing ownership from dom%d.\n",
256 xen_find_device_domain_owner(dev));
257 xen_unregister_device_domain_owner(dev);
258 xen_register_device_domain_owner(dev, pdev->xdev->otherend_id);
261 /* TODO: It'd be nice to export a bridge and have all of its children
262 * get exported with it. This may be best done in xend (which will
263 * have to calculate resource usage anyway) but we probably want to
264 * put something in here to ensure that if a bridge gets given to a
265 * driver domain, that all devices under that bridge are not given
266 * to other driver domains (as he who controls the bridge can disable
267 * it and stop the other devices from working).
269 out:
270 return err;
273 static int xen_pcibk_remove_device(struct xen_pcibk_device *pdev,
274 int domain, int bus, int slot, int func)
276 int err = 0;
277 struct pci_dev *dev;
279 dev_dbg(&pdev->xdev->dev, "removing dom %x bus %x slot %x func %x\n",
280 domain, bus, slot, func);
282 dev = xen_pcibk_get_pci_dev(pdev, domain, bus, PCI_DEVFN(slot, func));
283 if (!dev) {
284 err = -EINVAL;
285 dev_dbg(&pdev->xdev->dev, "Couldn't locate PCI device "
286 "(%04x:%02x:%02x.%d)! not owned by this domain\n",
287 domain, bus, slot, func);
288 goto out;
291 dev_dbg(&dev->dev, "unregistering for %d\n", pdev->xdev->otherend_id);
292 xen_unregister_device_domain_owner(dev);
294 /* N.B. This ends up calling pcistub_put_pci_dev which ends up
295 * doing the FLR. */
296 xen_pcibk_release_pci_dev(pdev, dev, true /* use the lock. */);
298 out:
299 return err;
302 static int xen_pcibk_publish_pci_root(struct xen_pcibk_device *pdev,
303 unsigned int domain, unsigned int bus)
305 unsigned int d, b;
306 int i, root_num, len, err;
307 char str[64];
309 dev_dbg(&pdev->xdev->dev, "Publishing pci roots\n");
311 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename,
312 "root_num", "%d", &root_num);
313 if (err == 0 || err == -ENOENT)
314 root_num = 0;
315 else if (err < 0)
316 goto out;
318 /* Verify that we haven't already published this pci root */
319 for (i = 0; i < root_num; i++) {
320 len = snprintf(str, sizeof(str), "root-%d", i);
321 if (unlikely(len >= (sizeof(str) - 1))) {
322 err = -ENOMEM;
323 goto out;
326 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename,
327 str, "%x:%x", &d, &b);
328 if (err < 0)
329 goto out;
330 if (err != 2) {
331 err = -EINVAL;
332 goto out;
335 if (d == domain && b == bus) {
336 err = 0;
337 goto out;
341 len = snprintf(str, sizeof(str), "root-%d", root_num);
342 if (unlikely(len >= (sizeof(str) - 1))) {
343 err = -ENOMEM;
344 goto out;
347 dev_dbg(&pdev->xdev->dev, "writing root %d at %04x:%02x\n",
348 root_num, domain, bus);
350 err = xenbus_printf(XBT_NIL, pdev->xdev->nodename, str,
351 "%04x:%02x", domain, bus);
352 if (err)
353 goto out;
355 err = xenbus_printf(XBT_NIL, pdev->xdev->nodename,
356 "root_num", "%d", (root_num + 1));
358 out:
359 return err;
362 static int xen_pcibk_reconfigure(struct xen_pcibk_device *pdev)
364 int err = 0;
365 int num_devs;
366 int domain, bus, slot, func;
367 int substate;
368 int i, len;
369 char state_str[64];
370 char dev_str[64];
373 dev_dbg(&pdev->xdev->dev, "Reconfiguring device ...\n");
375 mutex_lock(&pdev->dev_lock);
376 /* Make sure we only reconfigure once */
377 if (xenbus_read_driver_state(pdev->xdev->nodename) !=
378 XenbusStateReconfiguring)
379 goto out;
381 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename, "num_devs", "%d",
382 &num_devs);
383 if (err != 1) {
384 if (err >= 0)
385 err = -EINVAL;
386 xenbus_dev_fatal(pdev->xdev, err,
387 "Error reading number of devices");
388 goto out;
391 for (i = 0; i < num_devs; i++) {
392 len = snprintf(state_str, sizeof(state_str), "state-%d", i);
393 if (unlikely(len >= (sizeof(state_str) - 1))) {
394 err = -ENOMEM;
395 xenbus_dev_fatal(pdev->xdev, err,
396 "String overflow while reading "
397 "configuration");
398 goto out;
400 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename, state_str,
401 "%d", &substate);
402 if (err != 1)
403 substate = XenbusStateUnknown;
405 switch (substate) {
406 case XenbusStateInitialising:
407 dev_dbg(&pdev->xdev->dev, "Attaching dev-%d ...\n", i);
409 len = snprintf(dev_str, sizeof(dev_str), "dev-%d", i);
410 if (unlikely(len >= (sizeof(dev_str) - 1))) {
411 err = -ENOMEM;
412 xenbus_dev_fatal(pdev->xdev, err,
413 "String overflow while "
414 "reading configuration");
415 goto out;
417 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename,
418 dev_str, "%x:%x:%x.%x",
419 &domain, &bus, &slot, &func);
420 if (err < 0) {
421 xenbus_dev_fatal(pdev->xdev, err,
422 "Error reading device "
423 "configuration");
424 goto out;
426 if (err != 4) {
427 err = -EINVAL;
428 xenbus_dev_fatal(pdev->xdev, err,
429 "Error parsing pci device "
430 "configuration");
431 goto out;
434 err = xen_pcibk_export_device(pdev, domain, bus, slot,
435 func, i);
436 if (err)
437 goto out;
439 /* Publish pci roots. */
440 err = xen_pcibk_publish_pci_roots(pdev,
441 xen_pcibk_publish_pci_root);
442 if (err) {
443 xenbus_dev_fatal(pdev->xdev, err,
444 "Error while publish PCI root"
445 "buses for frontend");
446 goto out;
449 err = xenbus_printf(XBT_NIL, pdev->xdev->nodename,
450 state_str, "%d",
451 XenbusStateInitialised);
452 if (err) {
453 xenbus_dev_fatal(pdev->xdev, err,
454 "Error switching substate of "
455 "dev-%d\n", i);
456 goto out;
458 break;
460 case XenbusStateClosing:
461 dev_dbg(&pdev->xdev->dev, "Detaching dev-%d ...\n", i);
463 len = snprintf(dev_str, sizeof(dev_str), "vdev-%d", i);
464 if (unlikely(len >= (sizeof(dev_str) - 1))) {
465 err = -ENOMEM;
466 xenbus_dev_fatal(pdev->xdev, err,
467 "String overflow while "
468 "reading configuration");
469 goto out;
471 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename,
472 dev_str, "%x:%x:%x.%x",
473 &domain, &bus, &slot, &func);
474 if (err < 0) {
475 xenbus_dev_fatal(pdev->xdev, err,
476 "Error reading device "
477 "configuration");
478 goto out;
480 if (err != 4) {
481 err = -EINVAL;
482 xenbus_dev_fatal(pdev->xdev, err,
483 "Error parsing pci device "
484 "configuration");
485 goto out;
488 err = xen_pcibk_remove_device(pdev, domain, bus, slot,
489 func);
490 if (err)
491 goto out;
493 /* TODO: If at some point we implement support for pci
494 * root hot-remove on pcifront side, we'll need to
495 * remove unnecessary xenstore nodes of pci roots here.
498 break;
500 default:
501 break;
505 err = xenbus_switch_state(pdev->xdev, XenbusStateReconfigured);
506 if (err) {
507 xenbus_dev_fatal(pdev->xdev, err,
508 "Error switching to reconfigured state!");
509 goto out;
512 out:
513 mutex_unlock(&pdev->dev_lock);
514 return 0;
517 static void xen_pcibk_frontend_changed(struct xenbus_device *xdev,
518 enum xenbus_state fe_state)
520 struct xen_pcibk_device *pdev = dev_get_drvdata(&xdev->dev);
522 dev_dbg(&xdev->dev, "fe state changed %d\n", fe_state);
524 switch (fe_state) {
525 case XenbusStateInitialised:
526 xen_pcibk_attach(pdev);
527 break;
529 case XenbusStateReconfiguring:
530 xen_pcibk_reconfigure(pdev);
531 break;
533 case XenbusStateConnected:
534 /* pcifront switched its state from reconfiguring to connected.
535 * Then switch to connected state.
537 xenbus_switch_state(xdev, XenbusStateConnected);
538 break;
540 case XenbusStateClosing:
541 xen_pcibk_disconnect(pdev);
542 xenbus_switch_state(xdev, XenbusStateClosing);
543 break;
545 case XenbusStateClosed:
546 xen_pcibk_disconnect(pdev);
547 xenbus_switch_state(xdev, XenbusStateClosed);
548 if (xenbus_dev_is_online(xdev))
549 break;
550 /* fall through if not online */
551 case XenbusStateUnknown:
552 dev_dbg(&xdev->dev, "frontend is gone! unregister device\n");
553 device_unregister(&xdev->dev);
554 break;
556 default:
557 break;
561 static int xen_pcibk_setup_backend(struct xen_pcibk_device *pdev)
563 /* Get configuration from xend (if available now) */
564 int domain, bus, slot, func;
565 int err = 0;
566 int i, num_devs;
567 char dev_str[64];
568 char state_str[64];
570 mutex_lock(&pdev->dev_lock);
571 /* It's possible we could get the call to setup twice, so make sure
572 * we're not already connected.
574 if (xenbus_read_driver_state(pdev->xdev->nodename) !=
575 XenbusStateInitWait)
576 goto out;
578 dev_dbg(&pdev->xdev->dev, "getting be setup\n");
580 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename, "num_devs", "%d",
581 &num_devs);
582 if (err != 1) {
583 if (err >= 0)
584 err = -EINVAL;
585 xenbus_dev_fatal(pdev->xdev, err,
586 "Error reading number of devices");
587 goto out;
590 for (i = 0; i < num_devs; i++) {
591 int l = snprintf(dev_str, sizeof(dev_str), "dev-%d", i);
592 if (unlikely(l >= (sizeof(dev_str) - 1))) {
593 err = -ENOMEM;
594 xenbus_dev_fatal(pdev->xdev, err,
595 "String overflow while reading "
596 "configuration");
597 goto out;
600 err = xenbus_scanf(XBT_NIL, pdev->xdev->nodename, dev_str,
601 "%x:%x:%x.%x", &domain, &bus, &slot, &func);
602 if (err < 0) {
603 xenbus_dev_fatal(pdev->xdev, err,
604 "Error reading device configuration");
605 goto out;
607 if (err != 4) {
608 err = -EINVAL;
609 xenbus_dev_fatal(pdev->xdev, err,
610 "Error parsing pci device "
611 "configuration");
612 goto out;
615 err = xen_pcibk_export_device(pdev, domain, bus, slot, func, i);
616 if (err)
617 goto out;
619 /* Switch substate of this device. */
620 l = snprintf(state_str, sizeof(state_str), "state-%d", i);
621 if (unlikely(l >= (sizeof(state_str) - 1))) {
622 err = -ENOMEM;
623 xenbus_dev_fatal(pdev->xdev, err,
624 "String overflow while reading "
625 "configuration");
626 goto out;
628 err = xenbus_printf(XBT_NIL, pdev->xdev->nodename, state_str,
629 "%d", XenbusStateInitialised);
630 if (err) {
631 xenbus_dev_fatal(pdev->xdev, err, "Error switching "
632 "substate of dev-%d\n", i);
633 goto out;
637 err = xen_pcibk_publish_pci_roots(pdev, xen_pcibk_publish_pci_root);
638 if (err) {
639 xenbus_dev_fatal(pdev->xdev, err,
640 "Error while publish PCI root buses "
641 "for frontend");
642 goto out;
645 err = xenbus_switch_state(pdev->xdev, XenbusStateInitialised);
646 if (err)
647 xenbus_dev_fatal(pdev->xdev, err,
648 "Error switching to initialised state!");
650 out:
651 mutex_unlock(&pdev->dev_lock);
652 if (!err)
653 /* see if pcifront is already configured (if not, we'll wait) */
654 xen_pcibk_attach(pdev);
655 return err;
658 static void xen_pcibk_be_watch(struct xenbus_watch *watch,
659 const char **vec, unsigned int len)
661 struct xen_pcibk_device *pdev =
662 container_of(watch, struct xen_pcibk_device, be_watch);
664 switch (xenbus_read_driver_state(pdev->xdev->nodename)) {
665 case XenbusStateInitWait:
666 xen_pcibk_setup_backend(pdev);
667 break;
669 default:
670 break;
674 static int xen_pcibk_xenbus_probe(struct xenbus_device *dev,
675 const struct xenbus_device_id *id)
677 int err = 0;
678 struct xen_pcibk_device *pdev = alloc_pdev(dev);
680 if (pdev == NULL) {
681 err = -ENOMEM;
682 xenbus_dev_fatal(dev, err,
683 "Error allocating xen_pcibk_device struct");
684 goto out;
687 /* wait for xend to configure us */
688 err = xenbus_switch_state(dev, XenbusStateInitWait);
689 if (err)
690 goto out;
692 /* watch the backend node for backend configuration information */
693 err = xenbus_watch_path(dev, dev->nodename, &pdev->be_watch,
694 xen_pcibk_be_watch);
695 if (err)
696 goto out;
698 pdev->be_watching = 1;
700 /* We need to force a call to our callback here in case
701 * xend already configured us!
703 xen_pcibk_be_watch(&pdev->be_watch, NULL, 0);
705 out:
706 return err;
709 static int xen_pcibk_xenbus_remove(struct xenbus_device *dev)
711 struct xen_pcibk_device *pdev = dev_get_drvdata(&dev->dev);
713 if (pdev != NULL)
714 free_pdev(pdev);
716 return 0;
719 static const struct xenbus_device_id xen_pcibk_ids[] = {
720 {"pci"},
721 {""},
724 static struct xenbus_driver xen_pcibk_driver = {
725 .name = DRV_NAME,
726 .ids = xen_pcibk_ids,
727 .probe = xen_pcibk_xenbus_probe,
728 .remove = xen_pcibk_xenbus_remove,
729 .otherend_changed = xen_pcibk_frontend_changed,
732 const struct xen_pcibk_backend *__read_mostly xen_pcibk_backend;
734 int __init xen_pcibk_xenbus_register(void)
736 xen_pcibk_wq = create_workqueue("xen_pciback_workqueue");
737 if (!xen_pcibk_wq) {
738 pr_err("%s: create xen_pciback_workqueue failed\n", __func__);
739 return -EFAULT;
741 xen_pcibk_backend = &xen_pcibk_vpci_backend;
742 if (passthrough)
743 xen_pcibk_backend = &xen_pcibk_passthrough_backend;
744 pr_info("backend is %s\n", xen_pcibk_backend->name);
745 return xenbus_register_backend(&xen_pcibk_driver);
748 void __exit xen_pcibk_xenbus_unregister(void)
750 destroy_workqueue(xen_pcibk_wq);
751 xenbus_unregister_driver(&xen_pcibk_driver);