1 // SPDX-License-Identifier: GPL-2.0+
2 // Copyright 2017 IBM Corp.
3 #include <linux/fs.h>
4 #include <linux/poll.h>
5 #include <linux/sched/signal.h>
6 #include <linux/eventfd.h>
7 #include <linux/uaccess.h>
8 #include <uapi/misc/ocxl.h>
9 #include <asm/reg.h>
10 #include <asm/switch_to.h>
11 #include "ocxl_internal.h"
12
13
14 #define OCXL_NUM_MINORS 256 /* Total to reserve */
15
16 static dev_t ocxl_dev;
17 static struct class *ocxl_class;
18 static struct mutex minors_idr_lock;
19 static struct idr minors_idr;
20
/*
 * Look up the file info registered for a device number.
 * devno: the device number; only its minor part is used as the idr key
 * Returns: whatever idr_find() yields for that minor (the caller treats
 * NULL as "no such device")
 *
 * No RCU read-side critical section is declared around the lookup: the
 * AFU is protected by the reference count of the device. The info entry
 * is only removed from the idr once that reference count has dropped to
 * 0, at which point no user API can reach the AFU any more and this
 * function cannot hand it out.
 */
static struct ocxl_file_info *find_file_info(dev_t devno)
{
	return idr_find(&minors_idr, MINOR(devno));
}
35
allocate_minor(struct ocxl_file_info * info)36 static int allocate_minor(struct ocxl_file_info *info)
37 {
38 int minor;
39
40 mutex_lock(&minors_idr_lock);
41 minor = idr_alloc(&minors_idr, info, 0, OCXL_NUM_MINORS, GFP_KERNEL);
42 mutex_unlock(&minors_idr_lock);
43 return minor;
44 }
45
free_minor(struct ocxl_file_info * info)46 static void free_minor(struct ocxl_file_info *info)
47 {
48 mutex_lock(&minors_idr_lock);
49 idr_remove(&minors_idr, MINOR(info->dev.devt));
50 mutex_unlock(&minors_idr_lock);
51 }
52
afu_open(struct inode * inode,struct file * file)53 static int afu_open(struct inode *inode, struct file *file)
54 {
55 struct ocxl_file_info *info;
56 struct ocxl_context *ctx;
57 int rc;
58
59 pr_debug("%s for device %x\n", __func__, inode->i_rdev);
60
61 info = find_file_info(inode->i_rdev);
62 if (!info)
63 return -ENODEV;
64
65 rc = ocxl_context_alloc(&ctx, info->afu, inode->i_mapping);
66 if (rc)
67 return rc;
68
69 file->private_data = ctx;
70 return 0;
71 }
72
/*
 * OCXL_IOCTL_ATTACH: attach the context to the calling process' mm.
 * ctx: the context to attach
 * uarg: user pointer to the attach arguments
 * Returns: -EFAULT if the arguments cannot be read, -EINVAL if any
 * reserved field is non-zero, otherwise the result of
 * ocxl_context_attach()
 */
static long afu_ioctl_attach(struct ocxl_context *ctx,
		struct ocxl_ioctl_attach __user *uarg)
{
	struct ocxl_ioctl_attach params;
	u64 masked_amr;

	pr_debug("%s for context %d\n", __func__, ctx->pasid);

	if (copy_from_user(&params, uarg, sizeof(params)))
		return -EFAULT;

	/* Reserved fields must be zero, to keep them usable in the future */
	if (params.reserved1 || params.reserved2 || params.reserved3)
		return -EINVAL;

	/* Only keep the AMR bits that are also set in the UAMOR register */
	masked_amr = params.amr & mfspr(SPRN_UAMOR);

	return ocxl_context_attach(ctx, masked_amr, current->mm);
}
93
/*
 * OCXL_IOCTL_GET_METADATA: report AFU version, PASID and MMIO sizes.
 * ctx: the context being queried
 * uarg: user buffer receiving a struct ocxl_ioctl_metadata
 * Returns: 0 on success, -EFAULT if the result cannot be copied out
 */
static long afu_ioctl_get_metadata(struct ocxl_context *ctx,
		struct ocxl_ioctl_metadata __user *uarg)
{
	struct ocxl_afu *afu = ctx->afu;
	struct ocxl_ioctl_metadata md;

	/* Zero the whole structure so every byte copied out is initialized */
	memset(&md, 0, sizeof(md));

	md.version = 0;
	md.pasid = ctx->pasid;

	md.afu_version_major = afu->config.version_major;
	md.afu_version_minor = afu->config.version_minor;
	md.pp_mmio_size = afu->config.pp_mmio_stride;
	md.global_mmio_size = afu->config.global_mmio_size;

	return copy_to_user(uarg, &md, sizeof(md)) ? -EFAULT : 0;
}
114
115 #ifdef CONFIG_PPC64
/*
 * OCXL_IOCTL_ENABLE_P9_WAIT: make sure the context has a thread ID
 * (assigned from the calling thread if it has none yet) and report it.
 * ctx: the context to update
 * uarg: user buffer receiving a struct ocxl_ioctl_p9_wait
 * Returns: 0 on success, -ENOENT if the CPU lacks CPU_FTR_P9_TIDR or
 * set_thread_tidr() fails, the error from ocxl_link_update_pe() if the
 * update of an attached context fails, or -EFAULT if the result cannot
 * be copied out
 */
static long afu_ioctl_enable_p9_wait(struct ocxl_context *ctx,
		struct ocxl_ioctl_p9_wait __user *uarg)
{
	struct ocxl_ioctl_p9_wait arg;
	enum ocxl_context_status status;
	int rc;

	if (!cpu_has_feature(CPU_FTR_P9_TIDR))
		return -ENOENT;

	memset(&arg, 0, sizeof(arg));

	/* status_mutex protects both ctx->status and ctx->tidr */
	mutex_lock(&ctx->status_mutex);
	if (!ctx->tidr) {
		if (set_thread_tidr(current)) {
			mutex_unlock(&ctx->status_mutex);
			return -ENOENT;
		}

		ctx->tidr = current->thread.tidr;
	}
	status = ctx->status;
	mutex_unlock(&ctx->status_mutex);

	/* An attached context gets its thread ID passed on to the link */
	if (status == ATTACHED) {
		rc = ocxl_link_update_pe(ctx->afu->fn->link,
				ctx->pasid, ctx->tidr);
		if (rc)
			return rc;
	}

	arg.thread_id = ctx->tidr;

	if (copy_to_user(uarg, &arg, sizeof(arg)))
		return -EFAULT;

	return 0;
}
157 #endif
158
159
/*
 * OCXL_IOCTL_GET_FEATURES: report the optional features that can be used.
 * ctx: the context the ioctl was issued on (not used by the query)
 * uarg: user buffer receiving a struct ocxl_ioctl_features
 * Returns: 0 on success, -EFAULT if the result cannot be copied out
 */
static long afu_ioctl_get_features(struct ocxl_context *ctx,
		struct ocxl_ioctl_features __user *uarg)
{
	struct ocxl_ioctl_features features;

	memset(&features, 0, sizeof(features));

#ifdef CONFIG_PPC64
	/* The P9 wait flag is advertised only when the CPU has TIDR */
	if (cpu_has_feature(CPU_FTR_P9_TIDR))
		features.flags[0] |= OCXL_IOCTL_FEATURES_FLAGS0_P9_WAIT;
#endif

	return copy_to_user(uarg, &features, sizeof(features)) ? -EFAULT : 0;
}
177
/*
 * Map an ioctl command number to a printable name, for debug messages.
 * Evaluates to "UNKNOWN" for any command that is not listed.
 * The argument is parenthesized so that expression arguments compare as
 * a whole; note that it is evaluated once per comparison, so it must
 * not have side effects.
 */
#define CMD_STR(x) ((x) == OCXL_IOCTL_ATTACH ? "ATTACH" :		\
		(x) == OCXL_IOCTL_IRQ_ALLOC ? "IRQ_ALLOC" :		\
		(x) == OCXL_IOCTL_IRQ_FREE ? "IRQ_FREE" :		\
		(x) == OCXL_IOCTL_IRQ_SET_FD ? "IRQ_SET_FD" :		\
		(x) == OCXL_IOCTL_GET_METADATA ? "GET_METADATA" :	\
		(x) == OCXL_IOCTL_ENABLE_P9_WAIT ? "ENABLE_P9_WAIT" :	\
		(x) == OCXL_IOCTL_GET_FEATURES ? "GET_FEATURES" :	\
		"UNKNOWN")
186
irq_handler(void * private)187 static irqreturn_t irq_handler(void *private)
188 {
189 struct eventfd_ctx *ev_ctx = private;
190
191 eventfd_signal(ev_ctx, 1);
192 return IRQ_HANDLED;
193 }
194
/*
 * Release callback paired with irq_handler(): drop the reference held
 * on the eventfd context.
 * private: the struct eventfd_ctx registered together with the handler
 */
static void irq_free(void *private)
{
	eventfd_ctx_put((struct eventfd_ctx *) private);
}
201
afu_ioctl(struct file * file,unsigned int cmd,unsigned long args)202 static long afu_ioctl(struct file *file, unsigned int cmd,
203 unsigned long args)
204 {
205 struct ocxl_context *ctx = file->private_data;
206 struct ocxl_ioctl_irq_fd irq_fd;
207 struct eventfd_ctx *ev_ctx;
208 int irq_id;
209 u64 irq_offset;
210 long rc;
211 bool closed;
212
213 pr_debug("%s for context %d, command %s\n", __func__, ctx->pasid,
214 CMD_STR(cmd));
215
216 mutex_lock(&ctx->status_mutex);
217 closed = (ctx->status == CLOSED);
218 mutex_unlock(&ctx->status_mutex);
219
220 if (closed)
221 return -EIO;
222
223 switch (cmd) {
224 case OCXL_IOCTL_ATTACH:
225 rc = afu_ioctl_attach(ctx,
226 (struct ocxl_ioctl_attach __user *) args);
227 break;
228
229 case OCXL_IOCTL_IRQ_ALLOC:
230 rc = ocxl_afu_irq_alloc(ctx, &irq_id);
231 if (!rc) {
232 irq_offset = ocxl_irq_id_to_offset(ctx, irq_id);
233 rc = copy_to_user((u64 __user *) args, &irq_offset,
234 sizeof(irq_offset));
235 if (rc) {
236 ocxl_afu_irq_free(ctx, irq_id);
237 return -EFAULT;
238 }
239 }
240 break;
241
242 case OCXL_IOCTL_IRQ_FREE:
243 rc = copy_from_user(&irq_offset, (u64 __user *) args,
244 sizeof(irq_offset));
245 if (rc)
246 return -EFAULT;
247 irq_id = ocxl_irq_offset_to_id(ctx, irq_offset);
248 rc = ocxl_afu_irq_free(ctx, irq_id);
249 break;
250
251 case OCXL_IOCTL_IRQ_SET_FD:
252 rc = copy_from_user(&irq_fd, (u64 __user *) args,
253 sizeof(irq_fd));
254 if (rc)
255 return -EFAULT;
256 if (irq_fd.reserved)
257 return -EINVAL;
258 irq_id = ocxl_irq_offset_to_id(ctx, irq_fd.irq_offset);
259 ev_ctx = eventfd_ctx_fdget(irq_fd.eventfd);
260 if (IS_ERR(ev_ctx))
261 return PTR_ERR(ev_ctx);
262 rc = ocxl_irq_set_handler(ctx, irq_id, irq_handler, irq_free, ev_ctx);
263 break;
264
265 case OCXL_IOCTL_GET_METADATA:
266 rc = afu_ioctl_get_metadata(ctx,
267 (struct ocxl_ioctl_metadata __user *) args);
268 break;
269
270 #ifdef CONFIG_PPC64
271 case OCXL_IOCTL_ENABLE_P9_WAIT:
272 rc = afu_ioctl_enable_p9_wait(ctx,
273 (struct ocxl_ioctl_p9_wait __user *) args);
274 break;
275 #endif
276
277 case OCXL_IOCTL_GET_FEATURES:
278 rc = afu_ioctl_get_features(ctx,
279 (struct ocxl_ioctl_features __user *) args);
280 break;
281
282 default:
283 rc = -EINVAL;
284 }
285 return rc;
286 }
287
/*
 * compat_ioctl() handler: every command is forwarded unchanged to
 * afu_ioctl(), whose result is returned as is.
 */
static long afu_compat_ioctl(struct file *file, unsigned int cmd,
		unsigned long args)
{
	long rc = afu_ioctl(file, cmd, args);

	return rc;
}
293
afu_mmap(struct file * file,struct vm_area_struct * vma)294 static int afu_mmap(struct file *file, struct vm_area_struct *vma)
295 {
296 struct ocxl_context *ctx = file->private_data;
297
298 pr_debug("%s for context %d\n", __func__, ctx->pasid);
299 return ocxl_context_mmap(ctx, vma);
300 }
301
has_xsl_error(struct ocxl_context * ctx)302 static bool has_xsl_error(struct ocxl_context *ctx)
303 {
304 bool ret;
305
306 mutex_lock(&ctx->xsl_error_lock);
307 ret = !!ctx->xsl_error.addr;
308 mutex_unlock(&ctx->xsl_error_lock);
309
310 return ret;
311 }
312
313 /*
314 * Are there any events pending on the AFU
315 * ctx: The AFU context
316 * Returns: true if there are events pending
317 */
afu_events_pending(struct ocxl_context * ctx)318 static bool afu_events_pending(struct ocxl_context *ctx)
319 {
320 if (has_xsl_error(ctx))
321 return true;
322 return false;
323 }
324
afu_poll(struct file * file,struct poll_table_struct * wait)325 static unsigned int afu_poll(struct file *file, struct poll_table_struct *wait)
326 {
327 struct ocxl_context *ctx = file->private_data;
328 unsigned int mask = 0;
329 bool closed;
330
331 pr_debug("%s for context %d\n", __func__, ctx->pasid);
332
333 poll_wait(file, &ctx->events_wq, wait);
334
335 mutex_lock(&ctx->status_mutex);
336 closed = (ctx->status == CLOSED);
337 mutex_unlock(&ctx->status_mutex);
338
339 if (afu_events_pending(ctx))
340 mask = EPOLLIN | EPOLLRDNORM;
341 else if (closed)
342 mask = EPOLLERR;
343
344 return mask;
345 }
346
347 /*
348 * Populate the supplied buffer with a single XSL error
349 * ctx: The AFU context to report the error from
350 * header: the event header to populate
351 * buf: The buffer to write the body into (should be at least
352 * AFU_EVENT_BODY_XSL_ERROR_SIZE)
353 * Return: the amount of buffer that was populated
354 */
append_xsl_error(struct ocxl_context * ctx,struct ocxl_kernel_event_header * header,char __user * buf)355 static ssize_t append_xsl_error(struct ocxl_context *ctx,
356 struct ocxl_kernel_event_header *header,
357 char __user *buf)
358 {
359 struct ocxl_kernel_event_xsl_fault_error body;
360
361 memset(&body, 0, sizeof(body));
362
363 mutex_lock(&ctx->xsl_error_lock);
364 if (!ctx->xsl_error.addr) {
365 mutex_unlock(&ctx->xsl_error_lock);
366 return 0;
367 }
368
369 body.addr = ctx->xsl_error.addr;
370 body.dsisr = ctx->xsl_error.dsisr;
371 body.count = ctx->xsl_error.count;
372
373 ctx->xsl_error.addr = 0;
374 ctx->xsl_error.dsisr = 0;
375 ctx->xsl_error.count = 0;
376
377 mutex_unlock(&ctx->xsl_error_lock);
378
379 header->type = OCXL_AFU_EVENT_XSL_FAULT_ERROR;
380
381 if (copy_to_user(buf, &body, sizeof(body)))
382 return -EFAULT;
383
384 return sizeof(body);
385 }
386
/* Size of the largest event body; the XSL fault error is the only one */
#define AFU_EVENT_BODY_MAX_SIZE \
	(sizeof(struct ocxl_kernel_event_xsl_fault_error))
388
389 /*
390 * Reports events on the AFU
391 * Format:
392 * Header (struct ocxl_kernel_event_header)
393 * Body (struct ocxl_kernel_event_*)
394 * Header...
395 */
afu_read(struct file * file,char __user * buf,size_t count,loff_t * off)396 static ssize_t afu_read(struct file *file, char __user *buf, size_t count,
397 loff_t *off)
398 {
399 struct ocxl_context *ctx = file->private_data;
400 struct ocxl_kernel_event_header header;
401 ssize_t rc;
402 ssize_t used = 0;
403 DEFINE_WAIT(event_wait);
404
405 memset(&header, 0, sizeof(header));
406
407 /* Require offset to be 0 */
408 if (*off != 0)
409 return -EINVAL;
410
411 if (count < (sizeof(struct ocxl_kernel_event_header) +
412 AFU_EVENT_BODY_MAX_SIZE))
413 return -EINVAL;
414
415 for (;;) {
416 prepare_to_wait(&ctx->events_wq, &event_wait,
417 TASK_INTERRUPTIBLE);
418
419 if (afu_events_pending(ctx))
420 break;
421
422 if (ctx->status == CLOSED)
423 break;
424
425 if (file->f_flags & O_NONBLOCK) {
426 finish_wait(&ctx->events_wq, &event_wait);
427 return -EAGAIN;
428 }
429
430 if (signal_pending(current)) {
431 finish_wait(&ctx->events_wq, &event_wait);
432 return -ERESTARTSYS;
433 }
434
435 schedule();
436 }
437
438 finish_wait(&ctx->events_wq, &event_wait);
439
440 if (has_xsl_error(ctx)) {
441 used = append_xsl_error(ctx, &header, buf + sizeof(header));
442 if (used < 0)
443 return used;
444 }
445
446 if (!afu_events_pending(ctx))
447 header.flags |= OCXL_KERNEL_EVENT_FLAG_LAST;
448
449 if (copy_to_user(buf, &header, sizeof(header)))
450 return -EFAULT;
451
452 used += sizeof(header);
453
454 rc = used;
455 return rc;
456 }
457
afu_release(struct inode * inode,struct file * file)458 static int afu_release(struct inode *inode, struct file *file)
459 {
460 struct ocxl_context *ctx = file->private_data;
461 int rc;
462
463 pr_debug("%s for device %x\n", __func__, inode->i_rdev);
464 rc = ocxl_context_detach(ctx);
465 mutex_lock(&ctx->mapping_lock);
466 ctx->mapping = NULL;
467 mutex_unlock(&ctx->mapping_lock);
468 wake_up_all(&ctx->events_wq);
469 if (rc != -EBUSY)
470 ocxl_context_free(ctx);
471 return 0;
472 }
473
474 static const struct file_operations ocxl_afu_fops = {
475 .owner = THIS_MODULE,
476 .open = afu_open,
477 .unlocked_ioctl = afu_ioctl,
478 .compat_ioctl = afu_compat_ioctl,
479 .mmap = afu_mmap,
480 .poll = afu_poll,
481 .read = afu_read,
482 .release = afu_release,
483 };
484
485 // Free the info struct
info_release(struct device * dev)486 static void info_release(struct device *dev)
487 {
488 struct ocxl_file_info *info = container_of(dev, struct ocxl_file_info, dev);
489
490 free_minor(info);
491 ocxl_afu_put(info->afu);
492 kfree(info);
493 }
494
ocxl_file_make_visible(struct ocxl_file_info * info)495 static int ocxl_file_make_visible(struct ocxl_file_info *info)
496 {
497 int rc;
498
499 cdev_init(&info->cdev, &ocxl_afu_fops);
500 rc = cdev_add(&info->cdev, info->dev.devt, 1);
501 if (rc) {
502 dev_err(&info->dev, "Unable to add afu char device: %d\n", rc);
503 return rc;
504 }
505
506 return 0;
507 }
508
ocxl_file_make_invisible(struct ocxl_file_info * info)509 static void ocxl_file_make_invisible(struct ocxl_file_info *info)
510 {
511 cdev_del(&info->cdev);
512 }
513
ocxl_file_register_afu(struct ocxl_afu * afu)514 int ocxl_file_register_afu(struct ocxl_afu *afu)
515 {
516 int minor;
517 int rc;
518 struct ocxl_file_info *info;
519 struct ocxl_fn *fn = afu->fn;
520 struct pci_dev *pci_dev = to_pci_dev(fn->dev.parent);
521
522 info = kzalloc(sizeof(*info), GFP_KERNEL);
523 if (info == NULL)
524 return -ENOMEM;
525
526 minor = allocate_minor(info);
527 if (minor < 0) {
528 kfree(info);
529 return minor;
530 }
531
532 info->dev.parent = &fn->dev;
533 info->dev.devt = MKDEV(MAJOR(ocxl_dev), minor);
534 info->dev.class = ocxl_class;
535 info->dev.release = info_release;
536
537 info->afu = afu;
538 ocxl_afu_get(afu);
539
540 rc = dev_set_name(&info->dev, "%s.%s.%hhu",
541 afu->config.name, dev_name(&pci_dev->dev), afu->config.idx);
542 if (rc)
543 goto err_put;
544
545 rc = device_register(&info->dev);
546 if (rc)
547 goto err_put;
548
549 rc = ocxl_sysfs_register_afu(info);
550 if (rc)
551 goto err_unregister;
552
553 rc = ocxl_file_make_visible(info);
554 if (rc)
555 goto err_unregister;
556
557 ocxl_afu_set_private(afu, info);
558
559 return 0;
560
561 err_unregister:
562 ocxl_sysfs_unregister_afu(info); // safe to call even if register failed
563 device_unregister(&info->dev);
564 err_put:
565 ocxl_afu_put(afu);
566 free_minor(info);
567 kfree(info);
568 return rc;
569 }
570
ocxl_file_unregister_afu(struct ocxl_afu * afu)571 void ocxl_file_unregister_afu(struct ocxl_afu *afu)
572 {
573 struct ocxl_file_info *info = ocxl_afu_get_private(afu);
574
575 if (!info)
576 return;
577
578 ocxl_file_make_invisible(info);
579 ocxl_sysfs_unregister_afu(info);
580 device_unregister(&info->dev);
581 }
582
/*
 * devnode callback of the ocxl class: build the device node name as
 * "ocxl/<device name>".
 * dev: the device being named
 * mode: not used
 * Returns: the string allocated by kasprintf()
 */
static char *ocxl_devnode(struct device *dev, umode_t *mode)
{
	const char *name = dev_name(dev);

	return kasprintf(GFP_KERNEL, "ocxl/%s", name);
}
587
ocxl_file_init(void)588 int ocxl_file_init(void)
589 {
590 int rc;
591
592 mutex_init(&minors_idr_lock);
593 idr_init(&minors_idr);
594
595 rc = alloc_chrdev_region(&ocxl_dev, 0, OCXL_NUM_MINORS, "ocxl");
596 if (rc) {
597 pr_err("Unable to allocate ocxl major number: %d\n", rc);
598 return rc;
599 }
600
601 ocxl_class = class_create(THIS_MODULE, "ocxl");
602 if (IS_ERR(ocxl_class)) {
603 pr_err("Unable to create ocxl class\n");
604 unregister_chrdev_region(ocxl_dev, OCXL_NUM_MINORS);
605 return PTR_ERR(ocxl_class);
606 }
607
608 ocxl_class->devnode = ocxl_devnode;
609 return 0;
610 }
611
ocxl_file_exit(void)612 void ocxl_file_exit(void)
613 {
614 class_destroy(ocxl_class);
615 unregister_chrdev_region(ocxl_dev, OCXL_NUM_MINORS);
616 idr_destroy(&minors_idr);
617 }
618