2 * Copyright 2014 IBM Corp.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
10 #include <linux/spinlock.h>
11 #include <linux/module.h>
12 #include <linux/export.h>
13 #include <linux/kernel.h>
14 #include <linux/bitmap.h>
15 #include <linux/sched/signal.h>
16 #include <linux/poll.h>
17 #include <linux/pid.h>
20 #include <linux/slab.h>
21 #include <linux/sched/mm.h>
22 #include <linux/mmu_context.h>
23 #include <asm/cputable.h>
24 #include <asm/current.h>
25 #include <asm/copro.h>
30 #define CXL_NUM_MINORS 256 /* Total to reserve */
/*
 * Minor-number layout for AFU character devices.
 *
 * Every AFU slice owns three consecutive minors that follow its card's
 * minor: dedicated (D), master (M) and shared (S), in that order.
 *
 * The 'afu' argument is parenthesised wherever it is dereferenced so that
 * any pointer expression (e.g. "base + i" or "&array[i]") expands correctly.
 */
#define CXL_AFU_MINOR_D(afu) (CXL_CARD_MINOR((afu)->adapter) + 1 + (3 * (afu)->slice))
#define CXL_AFU_MINOR_M(afu) (CXL_AFU_MINOR_D(afu) + 1)
#define CXL_AFU_MINOR_S(afu) (CXL_AFU_MINOR_D(afu) + 2)
#define CXL_AFU_MKDEV_D(afu) MKDEV(MAJOR(cxl_dev), CXL_AFU_MINOR_D(afu))
#define CXL_AFU_MKDEV_M(afu) MKDEV(MAJOR(cxl_dev), CXL_AFU_MINOR_M(afu))
#define CXL_AFU_MKDEV_S(afu) MKDEV(MAJOR(cxl_dev), CXL_AFU_MINOR_S(afu))
39 #define CXL_DEVT_AFU(dev) ((MINOR(dev) % CXL_DEV_MINORS - 1) / 3)
41 #define CXL_DEVT_IS_CARD(dev) (MINOR(dev) % CXL_DEV_MINORS == 0)
45 static struct class *cxl_class
;
47 static int __afu_open(struct inode
*inode
, struct file
*file
, bool master
)
51 struct cxl_context
*ctx
;
52 int adapter_num
= CXL_DEVT_ADAPTER(inode
->i_rdev
);
53 int slice
= CXL_DEVT_AFU(inode
->i_rdev
);
56 pr_devel("afu_open afu%i.%i\n", slice
, adapter_num
);
58 if (!(adapter
= get_cxl_adapter(adapter_num
)))
61 if (slice
> adapter
->slices
)
64 spin_lock(&adapter
->afu_list_lock
);
65 if (!(afu
= adapter
->afu
[slice
])) {
66 spin_unlock(&adapter
->afu_list_lock
);
71 * taking a ref to the afu so that it doesn't go away
72 * for the rest of the function. This ref is released before
76 spin_unlock(&adapter
->afu_list_lock
);
78 if (!afu
->current_mode
)
81 if (!cxl_ops
->link_ok(adapter
, afu
)) {
86 if (!(ctx
= cxl_context_alloc())) {
91 rc
= cxl_context_init(ctx
, afu
, master
);
95 cxl_context_set_mapping(ctx
, inode
->i_mapping
);
97 pr_devel("afu_open pe: %i\n", ctx
->pe
);
98 file
->private_data
= ctx
;
100 /* indicate success */
104 /* release the ref taken earlier */
107 put_device(&adapter
->dev
);
111 int afu_open(struct inode
*inode
, struct file
*file
)
113 return __afu_open(inode
, file
, false);
116 static int afu_master_open(struct inode
*inode
, struct file
*file
)
118 return __afu_open(inode
, file
, true);
121 int afu_release(struct inode
*inode
, struct file
*file
)
123 struct cxl_context
*ctx
= file
->private_data
;
125 pr_devel("%s: closing cxl file descriptor. pe: %i\n",
127 cxl_context_detach(ctx
);
131 * Delete the context's mapping pointer, unless it's created by the
132 * kernel API, in which case leave it so it can be freed by reclaim_ctx()
134 if (!ctx
->kernelapi
) {
135 mutex_lock(&ctx
->mapping_lock
);
137 mutex_unlock(&ctx
->mapping_lock
);
141 * At this point all bottom halves have finished and we should be
142 * getting no more IRQs from the hardware for this context. Once it's
143 * removed from the IDR (and RCU synchronised) it's safe to free the
146 cxl_context_free(ctx
);
151 static long afu_ioctl_start_work(struct cxl_context
*ctx
,
152 struct cxl_ioctl_start_work __user
*uwork
)
154 struct cxl_ioctl_start_work work
;
158 pr_devel("%s: pe: %i\n", __func__
, ctx
->pe
);
160 /* Do this outside the status_mutex to avoid a circular dependency with
161 * the locking in cxl_mmap_fault() */
162 if (copy_from_user(&work
, uwork
, sizeof(work
)))
165 mutex_lock(&ctx
->status_mutex
);
166 if (ctx
->status
!= OPENED
) {
172 * if any of the reserved fields are set or any of the unused
173 * flags are set it's invalid
175 if (work
.reserved1
|| work
.reserved2
|| work
.reserved3
||
176 work
.reserved4
|| work
.reserved5
||
177 (work
.flags
& ~CXL_START_WORK_ALL
)) {
182 if (!(work
.flags
& CXL_START_WORK_NUM_IRQS
))
183 work
.num_interrupts
= ctx
->afu
->pp_irqs
;
184 else if ((work
.num_interrupts
< ctx
->afu
->pp_irqs
) ||
185 (work
.num_interrupts
> ctx
->afu
->irqs_max
)) {
190 if ((rc
= afu_register_irqs(ctx
, work
.num_interrupts
)))
193 if (work
.flags
& CXL_START_WORK_AMR
)
194 amr
= work
.amr
& mfspr(SPRN_UAMOR
);
196 if (work
.flags
& CXL_START_WORK_TID
)
197 ctx
->assign_tidr
= true;
199 ctx
->mmio_err_ff
= !!(work
.flags
& CXL_START_WORK_ERR_FF
);
202 * Increment the mapped context count for adapter. This also checks
203 * if adapter_context_lock is taken.
205 rc
= cxl_adapter_context_get(ctx
->afu
->adapter
);
207 afu_release_irqs(ctx
, ctx
);
212 * We grab the PID here and not in the file open to allow for the case
213 * where a process (master, some daemon, etc) has opened the chardev on
214 * behalf of another process, so the AFU's mm gets bound to the process
215 * that performs this ioctl and not the process that opened the file.
216 * Also we grab the PID of the group leader so that if the task that
217 * has performed the attach operation exits the mm context of the
218 * process is still accessible.
220 ctx
->pid
= get_task_pid(current
, PIDTYPE_PID
);
222 /* acquire a reference to the task's mm */
223 ctx
->mm
= get_task_mm(current
);
225 /* ensure this mm_struct can't be freed */
226 cxl_context_mm_count_get(ctx
);
229 /* decrement the use count from above */
231 /* make TLBIs for this context global */
232 mm_context_add_copro(ctx
->mm
);
236 * Increment driver use count. Enables global TLBIs for hash
237 * and callbacks to handle the segment table
242 * A barrier is needed to make sure all TLBIs are global
243 * before we attach and the context starts being used by the
246 * Needed after mm_context_add_copro() for radix and
247 * cxl_ctx_get() for hash/p8.
249 * The barrier should really be mb(), since it involves a
250 * device. However, it's only useful when we have local
251 * vs. global TLBIs, i.e SMP=y. So keep smp_mb().
255 trace_cxl_attach(ctx
, work
.work_element_descriptor
, work
.num_interrupts
, amr
);
257 if ((rc
= cxl_ops
->attach_process(ctx
, false, work
.work_element_descriptor
,
259 afu_release_irqs(ctx
, ctx
);
260 cxl_adapter_context_put(ctx
->afu
->adapter
);
264 cxl_context_mm_count_put(ctx
);
266 mm_context_remove_copro(ctx
->mm
);
271 if (work
.flags
& CXL_START_WORK_TID
) {
272 work
.tid
= ctx
->tidr
;
273 if (copy_to_user(uwork
, &work
, sizeof(work
)))
277 ctx
->status
= STARTED
;
280 mutex_unlock(&ctx
->status_mutex
);
284 static long afu_ioctl_process_element(struct cxl_context
*ctx
,
287 pr_devel("%s: pe: %i\n", __func__
, ctx
->pe
);
289 if (copy_to_user(upe
, &ctx
->external_pe
, sizeof(__u32
)))
295 static long afu_ioctl_get_afu_id(struct cxl_context
*ctx
,
296 struct cxl_afu_id __user
*upafuid
)
298 struct cxl_afu_id afuid
= { 0 };
300 afuid
.card_id
= ctx
->afu
->adapter
->adapter_num
;
301 afuid
.afu_offset
= ctx
->afu
->slice
;
302 afuid
.afu_mode
= ctx
->afu
->current_mode
;
304 /* set the flag bit in case the afu is a slave */
305 if (ctx
->afu
->current_mode
== CXL_MODE_DIRECTED
&& !ctx
->master
)
306 afuid
.flags
|= CXL_AFUID_FLAG_SLAVE
;
308 if (copy_to_user(upafuid
, &afuid
, sizeof(afuid
)))
314 long afu_ioctl(struct file
*file
, unsigned int cmd
, unsigned long arg
)
316 struct cxl_context
*ctx
= file
->private_data
;
318 if (ctx
->status
== CLOSED
)
321 if (!cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
))
324 pr_devel("afu_ioctl\n");
326 case CXL_IOCTL_START_WORK
:
327 return afu_ioctl_start_work(ctx
, (struct cxl_ioctl_start_work __user
*)arg
);
328 case CXL_IOCTL_GET_PROCESS_ELEMENT
:
329 return afu_ioctl_process_element(ctx
, (__u32 __user
*)arg
);
330 case CXL_IOCTL_GET_AFU_ID
:
331 return afu_ioctl_get_afu_id(ctx
, (struct cxl_afu_id __user
*)
337 static long afu_compat_ioctl(struct file
*file
, unsigned int cmd
,
340 return afu_ioctl(file
, cmd
, arg
);
343 int afu_mmap(struct file
*file
, struct vm_area_struct
*vm
)
345 struct cxl_context
*ctx
= file
->private_data
;
347 /* AFU must be started before we can MMIO */
348 if (ctx
->status
!= STARTED
)
351 if (!cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
))
354 return cxl_context_iomap(ctx
, vm
);
357 static inline bool ctx_event_pending(struct cxl_context
*ctx
)
359 if (ctx
->pending_irq
|| ctx
->pending_fault
|| ctx
->pending_afu_err
)
362 if (ctx
->afu_driver_ops
&& atomic_read(&ctx
->afu_driver_events
))
368 __poll_t
afu_poll(struct file
*file
, struct poll_table_struct
*poll
)
370 struct cxl_context
*ctx
= file
->private_data
;
375 poll_wait(file
, &ctx
->wq
, poll
);
377 pr_devel("afu_poll wait done pe: %i\n", ctx
->pe
);
379 spin_lock_irqsave(&ctx
->lock
, flags
);
380 if (ctx_event_pending(ctx
))
381 mask
|= EPOLLIN
| EPOLLRDNORM
;
382 else if (ctx
->status
== CLOSED
)
383 /* Only error on closed when there are no further events pending
386 spin_unlock_irqrestore(&ctx
->lock
, flags
);
388 pr_devel("afu_poll pe: %i returning %#x\n", ctx
->pe
, mask
);
393 static ssize_t
afu_driver_event_copy(struct cxl_context
*ctx
,
395 struct cxl_event
*event
,
396 struct cxl_event_afu_driver_reserved
*pl
)
400 ctx
->afu_driver_ops
->event_delivered(ctx
, pl
, -EINVAL
);
404 /* Check event size */
405 event
->header
.size
+= pl
->data_size
;
406 if (event
->header
.size
> CXL_READ_MIN_SIZE
) {
407 ctx
->afu_driver_ops
->event_delivered(ctx
, pl
, -EINVAL
);
411 /* Copy event header */
412 if (copy_to_user(buf
, event
, sizeof(struct cxl_event_header
))) {
413 ctx
->afu_driver_ops
->event_delivered(ctx
, pl
, -EFAULT
);
417 /* Copy event data */
418 buf
+= sizeof(struct cxl_event_header
);
419 if (copy_to_user(buf
, &pl
->data
, pl
->data_size
)) {
420 ctx
->afu_driver_ops
->event_delivered(ctx
, pl
, -EFAULT
);
424 ctx
->afu_driver_ops
->event_delivered(ctx
, pl
, 0); /* Success */
425 return event
->header
.size
;
428 ssize_t
afu_read(struct file
*file
, char __user
*buf
, size_t count
,
431 struct cxl_context
*ctx
= file
->private_data
;
432 struct cxl_event_afu_driver_reserved
*pl
= NULL
;
433 struct cxl_event event
;
438 if (!cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
))
441 if (count
< CXL_READ_MIN_SIZE
)
444 spin_lock_irqsave(&ctx
->lock
, flags
);
447 prepare_to_wait(&ctx
->wq
, &wait
, TASK_INTERRUPTIBLE
);
448 if (ctx_event_pending(ctx
) || (ctx
->status
== CLOSED
))
451 if (!cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
)) {
456 if (file
->f_flags
& O_NONBLOCK
) {
461 if (signal_pending(current
)) {
466 spin_unlock_irqrestore(&ctx
->lock
, flags
);
467 pr_devel("afu_read going to sleep...\n");
469 pr_devel("afu_read woken up\n");
470 spin_lock_irqsave(&ctx
->lock
, flags
);
473 finish_wait(&ctx
->wq
, &wait
);
475 memset(&event
, 0, sizeof(event
));
476 event
.header
.process_element
= ctx
->pe
;
477 event
.header
.size
= sizeof(struct cxl_event_header
);
478 if (ctx
->afu_driver_ops
&& atomic_read(&ctx
->afu_driver_events
)) {
479 pr_devel("afu_read delivering AFU driver specific event\n");
480 pl
= ctx
->afu_driver_ops
->fetch_event(ctx
);
481 atomic_dec(&ctx
->afu_driver_events
);
482 event
.header
.type
= CXL_EVENT_AFU_DRIVER
;
483 } else if (ctx
->pending_irq
) {
484 pr_devel("afu_read delivering AFU interrupt\n");
485 event
.header
.size
+= sizeof(struct cxl_event_afu_interrupt
);
486 event
.header
.type
= CXL_EVENT_AFU_INTERRUPT
;
487 event
.irq
.irq
= find_first_bit(ctx
->irq_bitmap
, ctx
->irq_count
) + 1;
488 clear_bit(event
.irq
.irq
- 1, ctx
->irq_bitmap
);
489 if (bitmap_empty(ctx
->irq_bitmap
, ctx
->irq_count
))
490 ctx
->pending_irq
= false;
491 } else if (ctx
->pending_fault
) {
492 pr_devel("afu_read delivering data storage fault\n");
493 event
.header
.size
+= sizeof(struct cxl_event_data_storage
);
494 event
.header
.type
= CXL_EVENT_DATA_STORAGE
;
495 event
.fault
.addr
= ctx
->fault_addr
;
496 event
.fault
.dsisr
= ctx
->fault_dsisr
;
497 ctx
->pending_fault
= false;
498 } else if (ctx
->pending_afu_err
) {
499 pr_devel("afu_read delivering afu error\n");
500 event
.header
.size
+= sizeof(struct cxl_event_afu_error
);
501 event
.header
.type
= CXL_EVENT_AFU_ERROR
;
502 event
.afu_error
.error
= ctx
->afu_err
;
503 ctx
->pending_afu_err
= false;
504 } else if (ctx
->status
== CLOSED
) {
505 pr_devel("afu_read fatal error\n");
506 spin_unlock_irqrestore(&ctx
->lock
, flags
);
509 WARN(1, "afu_read must be buggy\n");
511 spin_unlock_irqrestore(&ctx
->lock
, flags
);
513 if (event
.header
.type
== CXL_EVENT_AFU_DRIVER
)
514 return afu_driver_event_copy(ctx
, buf
, &event
, pl
);
516 if (copy_to_user(buf
, &event
, event
.header
.size
))
518 return event
.header
.size
;
521 finish_wait(&ctx
->wq
, &wait
);
522 spin_unlock_irqrestore(&ctx
->lock
, flags
);
527 * Note: if this is updated, we need to update api.c to patch the new ones in
530 const struct file_operations afu_fops
= {
531 .owner
= THIS_MODULE
,
535 .release
= afu_release
,
536 .unlocked_ioctl
= afu_ioctl
,
537 .compat_ioctl
= afu_compat_ioctl
,
541 static const struct file_operations afu_master_fops
= {
542 .owner
= THIS_MODULE
,
543 .open
= afu_master_open
,
546 .release
= afu_release
,
547 .unlocked_ioctl
= afu_ioctl
,
548 .compat_ioctl
= afu_compat_ioctl
,
553 static char *cxl_devnode(struct device
*dev
, umode_t
*mode
)
555 if (cpu_has_feature(CPU_FTR_HVMODE
) &&
556 CXL_DEVT_IS_CARD(dev
->devt
)) {
558 * These minor numbers will eventually be used to program the
559 * PSL and AFUs once we have dynamic reprogramming support
563 return kasprintf(GFP_KERNEL
, "cxl/%s", dev_name(dev
));
566 extern struct class *cxl_class
;
568 static int cxl_add_chardev(struct cxl_afu
*afu
, dev_t devt
, struct cdev
*cdev
,
569 struct device
**chardev
, char *postfix
, char *desc
,
570 const struct file_operations
*fops
)
575 cdev_init(cdev
, fops
);
576 if ((rc
= cdev_add(cdev
, devt
, 1))) {
577 dev_err(&afu
->dev
, "Unable to add %s chardev: %i\n", desc
, rc
);
581 dev
= device_create(cxl_class
, &afu
->dev
, devt
, afu
,
582 "afu%i.%i%s", afu
->adapter
->adapter_num
, afu
->slice
, postfix
);
584 dev_err(&afu
->dev
, "Unable to create %s chardev in sysfs: %i\n", desc
, rc
);
597 int cxl_chardev_d_afu_add(struct cxl_afu
*afu
)
599 return cxl_add_chardev(afu
, CXL_AFU_MKDEV_D(afu
), &afu
->afu_cdev_d
,
600 &afu
->chardev_d
, "d", "dedicated",
601 &afu_master_fops
); /* Uses master fops */
604 int cxl_chardev_m_afu_add(struct cxl_afu
*afu
)
606 return cxl_add_chardev(afu
, CXL_AFU_MKDEV_M(afu
), &afu
->afu_cdev_m
,
607 &afu
->chardev_m
, "m", "master",
611 int cxl_chardev_s_afu_add(struct cxl_afu
*afu
)
613 return cxl_add_chardev(afu
, CXL_AFU_MKDEV_S(afu
), &afu
->afu_cdev_s
,
614 &afu
->chardev_s
, "s", "shared",
618 void cxl_chardev_afu_remove(struct cxl_afu
*afu
)
620 if (afu
->chardev_d
) {
621 cdev_del(&afu
->afu_cdev_d
);
622 device_unregister(afu
->chardev_d
);
623 afu
->chardev_d
= NULL
;
625 if (afu
->chardev_m
) {
626 cdev_del(&afu
->afu_cdev_m
);
627 device_unregister(afu
->chardev_m
);
628 afu
->chardev_m
= NULL
;
630 if (afu
->chardev_s
) {
631 cdev_del(&afu
->afu_cdev_s
);
632 device_unregister(afu
->chardev_s
);
633 afu
->chardev_s
= NULL
;
637 int cxl_register_afu(struct cxl_afu
*afu
)
639 afu
->dev
.class = cxl_class
;
641 return device_register(&afu
->dev
);
644 int cxl_register_adapter(struct cxl
*adapter
)
646 adapter
->dev
.class = cxl_class
;
649 * Future: When we support dynamically reprogramming the PSL & AFU we
650 * will expose the interface to do that via a chardev:
651 * adapter->dev.devt = CXL_CARD_MKDEV(adapter);
654 return device_register(&adapter
->dev
);
657 dev_t
cxl_get_dev(void)
662 int __init
cxl_file_init(void)
667 * If these change we really need to update API. Either change some
668 * flags or update API version number CXL_API_VERSION.
670 BUILD_BUG_ON(CXL_API_VERSION
!= 3);
671 BUILD_BUG_ON(sizeof(struct cxl_ioctl_start_work
) != 64);
672 BUILD_BUG_ON(sizeof(struct cxl_event_header
) != 8);
673 BUILD_BUG_ON(sizeof(struct cxl_event_afu_interrupt
) != 8);
674 BUILD_BUG_ON(sizeof(struct cxl_event_data_storage
) != 32);
675 BUILD_BUG_ON(sizeof(struct cxl_event_afu_error
) != 16);
677 if ((rc
= alloc_chrdev_region(&cxl_dev
, 0, CXL_NUM_MINORS
, "cxl"))) {
678 pr_err("Unable to allocate CXL major number: %i\n", rc
);
682 pr_devel("CXL device allocated, MAJOR %i\n", MAJOR(cxl_dev
));
684 cxl_class
= class_create(THIS_MODULE
, "cxl");
685 if (IS_ERR(cxl_class
)) {
686 pr_err("Unable to create CXL class\n");
687 rc
= PTR_ERR(cxl_class
);
690 cxl_class
->devnode
= cxl_devnode
;
695 unregister_chrdev_region(cxl_dev
, CXL_NUM_MINORS
);
699 void cxl_file_exit(void)
701 unregister_chrdev_region(cxl_dev
, CXL_NUM_MINORS
);
702 class_destroy(cxl_class
);