868b32541ed21588f6a3d29c074f5f28cf77dd65
[dpdk.git] / lib / librte_eal / linuxapp / kni / kni_misc.c
1 /*-
2  * GPL LICENSE SUMMARY
3  *
4  *   Copyright(c) 2010-2014 Intel Corporation. All rights reserved.
5  *
6  *   This program is free software; you can redistribute it and/or modify
7  *   it under the terms of version 2 of the GNU General Public License as
8  *   published by the Free Software Foundation.
9  *
10  *   This program is distributed in the hope that it will be useful, but
11  *   WITHOUT ANY WARRANTY; without even the implied warranty of
12  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  *   General Public License for more details.
14  *
15  *   You should have received a copy of the GNU General Public License
16  *   along with this program; if not, write to the Free Software
17  *   Foundation, Inc., 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
18  *   The full GNU General Public License is included in this distribution
19  *   in the file called LICENSE.GPL.
20  *
21  *   Contact Information:
22  *   Intel Corporation
23  */
24
25 #include <linux/module.h>
26 #include <linux/miscdevice.h>
27 #include <linux/netdevice.h>
28 #include <linux/pci.h>
29 #include <linux/kthread.h>
30 #include <linux/rwsem.h>
31
32 #include <exec-env/rte_kni_common.h>
33 #include "kni_dev.h"
34 #include <rte_config.h>
35
/*
 * Module metadata.
 * NOTE(review): the licence string below says "Dual BSD/GPL" while the
 * header comment of this file describes GPL version 2 only - confirm which
 * one is intended.
 */
MODULE_LICENSE("Dual BSD/GPL");
MODULE_AUTHOR("Intel Corporation");
MODULE_DESCRIPTION("Kernel Module for managing kni devices");

/* Number of polling passes a KNI kernel thread performs before it sleeps */
#define KNI_RX_LOOP_NUM 1000

/* NOTE(review): not referenced in the visible part of this file */
#define KNI_MAX_DEVICES 32

/* KNI helpers implemented outside this file */
extern void kni_net_rx(struct kni_dev *kni);
extern void kni_net_init(struct net_device *dev);
extern void kni_net_config_lo_mode(char *lo_str);
extern void kni_net_poll_resp(struct kni_dev *kni);
extern void kni_set_ethtool_ops(struct net_device *netdev);

/* Per-driver probe/remove hooks used for ethtool support of igb/ixgbe */
extern int ixgbe_kni_probe(struct pci_dev *pdev, struct net_device **lad_dev);
extern void ixgbe_kni_remove(struct pci_dev *pdev);
extern int igb_kni_probe(struct pci_dev *pdev, struct net_device **lad_dev);
extern void igb_kni_remove(struct pci_dev *pdev);

/* File operation handlers and helpers defined later in this file */
static int kni_open(struct inode *inode, struct file *file);
static int kni_release(struct inode *inode, struct file *file);
static int kni_ioctl(struct inode *inode, unsigned int ioctl_num,
                                        unsigned long ioctl_param);
static int kni_compat_ioctl(struct inode *inode, unsigned int ioctl_num,
                                                unsigned long ioctl_param);
static int kni_dev_remove(struct kni_dev *dev);

/* Validates the kthread_mode module parameter; called from kni_init() */
static int __init kni_parse_kthread_mode(void);

/* KNI processing for single kernel thread mode */
static int kni_thread_single(void *unused);
/* KNI processing for multiple kernel thread mode */
static int kni_thread_multiple(void *param);
69
/*
 * File operations of the KNI misc device.
 *
 * NOTE(review): kni_ioctl() and kni_compat_ioctl() are declared with a
 * "struct inode *" first parameter and an int return type, and are cast
 * through "void *" to fit the ioctl slots below. The cast silences any
 * prototype mismatch - confirm the handlers agree with the prototypes that
 * struct file_operations expects on the target kernel.
 */
static struct file_operations kni_fops = {
        .owner = THIS_MODULE,
        .open = kni_open,
        .release = kni_release,
        .unlocked_ioctl = (void *)kni_ioctl,
        .compat_ioctl = (void *)kni_compat_ioctl,
};
77
/*
 * Misc device descriptor registered in kni_init(): the minor number is
 * assigned dynamically, the node is named KNI_DEVICE and is served by
 * kni_fops.
 */
static struct miscdevice kni_misc = {
        .minor = MISC_DYNAMIC_MINOR,
        .name = KNI_DEVICE,
        .fops = &kni_fops,
};
83
/* Value of the "lo_mode" module parameter (NULL when not supplied) */
static char *lo_mode = NULL;

/* Value of the "kthread_mode" module parameter (NULL when not supplied) */
static char *kthread_mode = NULL;
/* Set to 1 by kni_parse_kthread_mode() when kthread_mode is "multiple" */
static unsigned multiple_kthread_on = 0;

#define KNI_DEV_IN_USE_BIT_NUM 0 /* Bit number for device in use */

/* Bit KNI_DEV_IN_USE_BIT_NUM is set by kni_open() and cleared on release */
static volatile unsigned long device_in_use; /* device in use flag */
/* Polling thread started by kni_open() in single kernel thread mode */
static struct task_struct *kni_kthread;

/* Protects kni_list_head: read side for walking, write side for changes */
static DECLARE_RWSEM(kni_list_lock);

/* List of the KNI devices created through the create ioctl */
static struct list_head kni_list_head = LIST_HEAD_INIT(kni_list_head);
101
102 static int __init
103 kni_init(void)
104 {
105         KNI_PRINT("######## DPDK kni module loading ########\n");
106
107         if (kni_parse_kthread_mode() < 0) {
108                 KNI_ERR("Invalid parameter for kthread_mode\n");
109                 return -EINVAL;
110         }
111
112         if (misc_register(&kni_misc) != 0) {
113                 KNI_ERR("Misc registration failed\n");
114                 return -EPERM;
115         }
116
117         /* Clear the bit of device in use */
118         clear_bit(KNI_DEV_IN_USE_BIT_NUM, &device_in_use);
119
120         /* Configure the lo mode according to the input parameter */
121         kni_net_config_lo_mode(lo_mode);
122
123         KNI_PRINT("######## DPDK kni module loaded  ########\n");
124
125         return 0;
126 }
127
128 static void __exit
129 kni_exit(void)
130 {
131         misc_deregister(&kni_misc);
132         KNI_PRINT("####### DPDK kni module unloaded  #######\n");
133 }
134
135 static int __init
136 kni_parse_kthread_mode(void)
137 {
138         if (!kthread_mode)
139                 return 0;
140
141         if (strcmp(kthread_mode, "single") == 0)
142                 return 0;
143         else if (strcmp(kthread_mode, "multiple") == 0)
144                 multiple_kthread_on = 1;
145         else
146                 return -1;
147
148         return 0;
149 }
150
151 static int
152 kni_open(struct inode *inode, struct file *file)
153 {
154         /* kni device can be opened by one user only, test and set bit */
155         if (test_and_set_bit(KNI_DEV_IN_USE_BIT_NUM, &device_in_use))
156                 return -EBUSY;
157
158         /* Create kernel thread for single mode */
159         if (multiple_kthread_on == 0) {
160                 KNI_PRINT("Single kernel thread for all KNI devices\n");
161                 /* Create kernel thread for RX */
162                 kni_kthread = kthread_run(kni_thread_single, NULL,
163                                                 "kni_single");
164                 if (IS_ERR(kni_kthread)) {
165                         KNI_ERR("Unable to create kernel threaed\n");
166                         return PTR_ERR(kni_kthread);
167                 }
168         } else
169                 KNI_PRINT("Multiple kernel thread mode enabled\n");
170
171         KNI_PRINT("/dev/kni opened\n");
172
173         return 0;
174 }
175
176 static int
177 kni_release(struct inode *inode, struct file *file)
178 {
179         struct kni_dev *dev, *n;
180
181         /* Stop kernel thread for single mode */
182         if (multiple_kthread_on == 0) {
183                 /* Stop kernel thread */
184                 kthread_stop(kni_kthread);
185                 kni_kthread = NULL;
186         }
187
188         down_write(&kni_list_lock);
189         list_for_each_entry_safe(dev, n, &kni_list_head, list) {
190                 /* Stop kernel thread for multiple mode */
191                 if (multiple_kthread_on && dev->pthread != NULL) {
192                         kthread_stop(dev->pthread);
193                         dev->pthread = NULL;
194                 }
195
196 #ifdef RTE_KNI_VHOST
197                 kni_vhost_backend_release(dev);
198 #endif
199                 kni_dev_remove(dev);
200                 list_del(&dev->list);
201         }
202         up_write(&kni_list_lock);
203
204         /* Clear the bit of device in use */
205         clear_bit(KNI_DEV_IN_USE_BIT_NUM, &device_in_use);
206
207         KNI_PRINT("/dev/kni closed\n");
208
209         return 0;
210 }
211
212 static int
213 kni_thread_single(void *unused)
214 {
215         int j;
216         struct kni_dev *dev, *n;
217
218         while (!kthread_should_stop()) {
219                 down_read(&kni_list_lock);
220                 for (j = 0; j < KNI_RX_LOOP_NUM; j++) {
221                         list_for_each_entry_safe(dev, n,
222                                         &kni_list_head, list) {
223 #ifdef RTE_KNI_VHOST
224                                 kni_chk_vhost_rx(dev);
225 #else
226                                 kni_net_rx(dev);
227 #endif
228                                 kni_net_poll_resp(dev);
229                         }
230                 }
231                 up_read(&kni_list_lock);
232                 /* reschedule out for a while */
233                 schedule_timeout_interruptible(usecs_to_jiffies( \
234                                 KNI_KTHREAD_RESCHEDULE_INTERVAL));
235         }
236
237         return 0;
238 }
239
240 static int
241 kni_thread_multiple(void *param)
242 {
243         int j;
244         struct kni_dev *dev = (struct kni_dev *)param;
245
246         while (!kthread_should_stop()) {
247                 for (j = 0; j < KNI_RX_LOOP_NUM; j++) {
248 #ifdef RTE_KNI_VHOST
249                         kni_chk_vhost_rx(dev);
250 #else
251                         kni_net_rx(dev);
252 #endif
253                         kni_net_poll_resp(dev);
254                 }
255                 schedule_timeout_interruptible(usecs_to_jiffies( \
256                                 KNI_KTHREAD_RESCHEDULE_INTERVAL));
257         }
258
259         return 0;
260 }
261
262 static int
263 kni_dev_remove(struct kni_dev *dev)
264 {
265         if (!dev)
266                 return -ENODEV;
267
268         switch (dev->device_id) {
269         #define RTE_PCI_DEV_ID_DECL_IGB(vend, dev) case (dev):
270         #include <rte_pci_dev_ids.h>
271                 igb_kni_remove(dev->pci_dev);
272                 break;
273         #define RTE_PCI_DEV_ID_DECL_IXGBE(vend, dev) case (dev):
274         #include <rte_pci_dev_ids.h>
275                 ixgbe_kni_remove(dev->pci_dev);
276                 break;
277         default:
278                 break;
279         }
280
281         if (dev->net_dev) {
282                 unregister_netdev(dev->net_dev);
283                 free_netdev(dev->net_dev);
284         }
285
286         return 0;
287 }
288
289 static int
290 kni_check_param(struct kni_dev *kni, struct rte_kni_device_info *dev)
291 {
292         if (!kni || !dev)
293                 return -1;
294
295         /* Check if network name has been used */
296         if (!strncmp(kni->name, dev->name, RTE_KNI_NAMESIZE)) {
297                 KNI_ERR("KNI name %s duplicated\n", dev->name);
298                 return -1;
299         }
300
301         return 0;
302 }
303
304 static int
305 kni_ioctl_create(unsigned int ioctl_num, unsigned long ioctl_param)
306 {
307         int ret;
308         struct rte_kni_device_info dev_info;
309         struct pci_dev *pci = NULL;
310         struct pci_dev *found_pci = NULL;
311         struct net_device *net_dev = NULL;
312         struct net_device *lad_dev = NULL;
313         struct kni_dev *kni, *dev, *n;
314         struct net *net;
315
316         printk(KERN_INFO "KNI: Creating kni...\n");
317         /* Check the buffer size, to avoid warning */
318         if (_IOC_SIZE(ioctl_num) > sizeof(dev_info))
319                 return -EINVAL;
320
321         /* Copy kni info from user space */
322         ret = copy_from_user(&dev_info, (void *)ioctl_param, sizeof(dev_info));
323         if (ret) {
324                 KNI_ERR("copy_from_user in kni_ioctl_create");
325                 return -EIO;
326         }
327
328         /**
329          * Check if the cpu core id is valid for binding,
330          * for multiple kernel thread mode.
331          */
332         if (multiple_kthread_on && dev_info.force_bind &&
333                                 !cpu_online(dev_info.core_id)) {
334                 KNI_ERR("cpu %u is not online\n", dev_info.core_id);
335                 return -EINVAL;
336         }
337
338         /* Check if it has been created */
339         down_read(&kni_list_lock);
340         list_for_each_entry_safe(dev, n, &kni_list_head, list) {
341                 if (kni_check_param(dev, &dev_info) < 0) {
342                         up_read(&kni_list_lock);
343                         return -EINVAL;
344                 }
345         }
346         up_read(&kni_list_lock);
347
348         net_dev = alloc_netdev(sizeof(struct kni_dev), dev_info.name,
349 #ifdef NET_NAME_UNKNOWN
350                                                         NET_NAME_UNKNOWN,
351 #endif
352                                                         kni_net_init);
353         if (net_dev == NULL) {
354                 KNI_ERR("error allocating device \"%s\"\n", dev_info.name);
355                 return -EBUSY;
356         }
357
358         net = get_net_ns_by_pid(current->pid);
359         if (IS_ERR(net)) {
360                 free_netdev(net_dev);
361                 return PTR_ERR(net);
362         }
363         dev_net_set(net_dev, net);
364         put_net(net);
365
366         kni = netdev_priv(net_dev);
367
368         kni->net_dev = net_dev;
369         kni->group_id = dev_info.group_id;
370         kni->core_id = dev_info.core_id;
371         strncpy(kni->name, dev_info.name, RTE_KNI_NAMESIZE);
372
373         /* Translate user space info into kernel space info */
374         kni->tx_q = phys_to_virt(dev_info.tx_phys);
375         kni->rx_q = phys_to_virt(dev_info.rx_phys);
376         kni->alloc_q = phys_to_virt(dev_info.alloc_phys);
377         kni->free_q = phys_to_virt(dev_info.free_phys);
378
379         kni->req_q = phys_to_virt(dev_info.req_phys);
380         kni->resp_q = phys_to_virt(dev_info.resp_phys);
381         kni->sync_va = dev_info.sync_va;
382         kni->sync_kva = phys_to_virt(dev_info.sync_phys);
383
384         kni->mbuf_kva = phys_to_virt(dev_info.mbuf_phys);
385         kni->mbuf_va = dev_info.mbuf_va;
386
387 #ifdef RTE_KNI_VHOST
388         kni->vhost_queue = NULL;
389         kni->vq_status = BE_STOP;
390 #endif
391         kni->mbuf_size = dev_info.mbuf_size;
392
393         KNI_PRINT("tx_phys:      0x%016llx, tx_q addr:      0x%p\n",
394                 (unsigned long long) dev_info.tx_phys, kni->tx_q);
395         KNI_PRINT("rx_phys:      0x%016llx, rx_q addr:      0x%p\n",
396                 (unsigned long long) dev_info.rx_phys, kni->rx_q);
397         KNI_PRINT("alloc_phys:   0x%016llx, alloc_q addr:   0x%p\n",
398                 (unsigned long long) dev_info.alloc_phys, kni->alloc_q);
399         KNI_PRINT("free_phys:    0x%016llx, free_q addr:    0x%p\n",
400                 (unsigned long long) dev_info.free_phys, kni->free_q);
401         KNI_PRINT("req_phys:     0x%016llx, req_q addr:     0x%p\n",
402                 (unsigned long long) dev_info.req_phys, kni->req_q);
403         KNI_PRINT("resp_phys:    0x%016llx, resp_q addr:    0x%p\n",
404                 (unsigned long long) dev_info.resp_phys, kni->resp_q);
405         KNI_PRINT("mbuf_phys:    0x%016llx, mbuf_kva:       0x%p\n",
406                 (unsigned long long) dev_info.mbuf_phys, kni->mbuf_kva);
407         KNI_PRINT("mbuf_va:      0x%p\n", dev_info.mbuf_va);
408         KNI_PRINT("mbuf_size:    %u\n", kni->mbuf_size);
409
410         KNI_DBG("PCI: %02x:%02x.%02x %04x:%04x\n",
411                                         dev_info.bus,
412                                         dev_info.devid,
413                                         dev_info.function,
414                                         dev_info.vendor_id,
415                                         dev_info.device_id);
416
417         pci = pci_get_device(dev_info.vendor_id, dev_info.device_id, NULL);
418
419         /* Support Ethtool */
420         while (pci) {
421                 KNI_PRINT("pci_bus: %02x:%02x:%02x \n",
422                                         pci->bus->number,
423                                         PCI_SLOT(pci->devfn),
424                                         PCI_FUNC(pci->devfn));
425
426                 if ((pci->bus->number == dev_info.bus) &&
427                         (PCI_SLOT(pci->devfn) == dev_info.devid) &&
428                         (PCI_FUNC(pci->devfn) == dev_info.function)) {
429                         found_pci = pci;
430                         switch (dev_info.device_id) {
431                         #define RTE_PCI_DEV_ID_DECL_IGB(vend, dev) case (dev):
432                         #include <rte_pci_dev_ids.h>
433                                 ret = igb_kni_probe(found_pci, &lad_dev);
434                                 break;
435                         #define RTE_PCI_DEV_ID_DECL_IXGBE(vend, dev) \
436                                                         case (dev):
437                         #include <rte_pci_dev_ids.h>
438                                 ret = ixgbe_kni_probe(found_pci, &lad_dev);
439                                 break;
440                         default:
441                                 ret = -1;
442                                 break;
443                         }
444
445                         KNI_DBG("PCI found: pci=0x%p, lad_dev=0x%p\n",
446                                                         pci, lad_dev);
447                         if (ret == 0) {
448                                 kni->lad_dev = lad_dev;
449                                 kni_set_ethtool_ops(kni->net_dev);
450                         } else {
451                                 KNI_ERR("Device not supported by ethtool");
452                                 kni->lad_dev = NULL;
453                         }
454
455                         kni->pci_dev = found_pci;
456                         kni->device_id = dev_info.device_id;
457                         break;
458                 }
459                 pci = pci_get_device(dev_info.vendor_id,
460                                 dev_info.device_id, pci);
461         }
462         if (pci)
463                 pci_dev_put(pci);
464
465         ret = register_netdev(net_dev);
466         if (ret) {
467                 KNI_ERR("error %i registering device \"%s\"\n",
468                                         ret, dev_info.name);
469                 kni_dev_remove(kni);
470                 return -ENODEV;
471         }
472
473 #ifdef RTE_KNI_VHOST
474         kni_vhost_init(kni);
475 #endif
476
477         /**
478          * Create a new kernel thread for multiple mode, set its core affinity,
479          * and finally wake it up.
480          */
481         if (multiple_kthread_on) {
482                 kni->pthread = kthread_create(kni_thread_multiple,
483                                               (void *)kni,
484                                               "kni_%s", kni->name);
485                 if (IS_ERR(kni->pthread)) {
486                         kni_dev_remove(kni);
487                         return -ECANCELED;
488                 }
489                 if (dev_info.force_bind)
490                         kthread_bind(kni->pthread, kni->core_id);
491                 wake_up_process(kni->pthread);
492         }
493
494         down_write(&kni_list_lock);
495         list_add(&kni->list, &kni_list_head);
496         up_write(&kni_list_lock);
497
498         return 0;
499 }
500
501 static int
502 kni_ioctl_release(unsigned int ioctl_num, unsigned long ioctl_param)
503 {
504         int ret = -EINVAL;
505         struct kni_dev *dev, *n;
506         struct rte_kni_device_info dev_info;
507
508         if (_IOC_SIZE(ioctl_num) > sizeof(dev_info))
509                         return -EINVAL;
510
511         ret = copy_from_user(&dev_info, (void *)ioctl_param, sizeof(dev_info));
512         if (ret) {
513                 KNI_ERR("copy_from_user in kni_ioctl_release");
514                 return -EIO;
515         }
516
517         /* Release the network device according to its name */
518         if (strlen(dev_info.name) == 0)
519                 return ret;
520
521         down_write(&kni_list_lock);
522         list_for_each_entry_safe(dev, n, &kni_list_head, list) {
523                 if (strncmp(dev->name, dev_info.name, RTE_KNI_NAMESIZE) != 0)
524                         continue;
525
526                 if (multiple_kthread_on && dev->pthread != NULL) {
527                         kthread_stop(dev->pthread);
528                         dev->pthread = NULL;
529                 }
530
531 #ifdef RTE_KNI_VHOST
532                 kni_vhost_backend_release(dev);
533 #endif
534                 kni_dev_remove(dev);
535                 list_del(&dev->list);
536                 ret = 0;
537                 break;
538         }
539         up_write(&kni_list_lock);
540         printk(KERN_INFO "KNI: %s release kni named %s\n",
541                 (ret == 0 ? "Successfully" : "Unsuccessfully"), dev_info.name);
542
543         return ret;
544 }
545
546 static int
547 kni_ioctl(struct inode *inode,
548         unsigned int ioctl_num,
549         unsigned long ioctl_param)
550 {
551         int ret = -EINVAL;
552
553         KNI_DBG("IOCTL num=0x%0x param=0x%0lx \n", ioctl_num, ioctl_param);
554
555         /*
556          * Switch according to the ioctl called
557          */
558         switch (_IOC_NR(ioctl_num)) {
559         case _IOC_NR(RTE_KNI_IOCTL_TEST):
560                 /* For test only, not used */
561                 break;
562         case _IOC_NR(RTE_KNI_IOCTL_CREATE):
563                 ret = kni_ioctl_create(ioctl_num, ioctl_param);
564                 break;
565         case _IOC_NR(RTE_KNI_IOCTL_RELEASE):
566                 ret = kni_ioctl_release(ioctl_num, ioctl_param);
567                 break;
568         default:
569                 KNI_DBG("IOCTL default \n");
570                 break;
571         }
572
573         return ret;
574 }
575
576 static int
577 kni_compat_ioctl(struct inode *inode,
578                 unsigned int ioctl_num,
579                 unsigned long ioctl_param)
580 {
581         /* 32 bits app on 64 bits OS to be supported later */
582         KNI_PRINT("Not implemented.\n");
583
584         return -EINVAL;
585 }
586
/* Entry and exit points of the module */
module_init(kni_init);
module_exit(kni_exit);

/*
 * lo_mode: handed to kni_net_config_lo_mode() when the module is loaded.
 * Readable by everyone and writable by the owner through sysfs.
 */
module_param(lo_mode, charp, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(lo_mode,
"KNI loopback mode (default=lo_mode_none):\n"
"    lo_mode_none        Kernel loopback disabled\n"
"    lo_mode_fifo        Enable kernel loopback with fifo\n"
"    lo_mode_fifo_skb    Enable kernel loopback with fifo and skb buffer\n"
"\n"
);

/*
 * kthread_mode: checked once by kni_parse_kthread_mode() when the module is
 * loaded. Read-only through sysfs.
 */
module_param(kthread_mode, charp, S_IRUGO);
MODULE_PARM_DESC(kthread_mode,
"Kernel thread mode (default=single):\n"
"    single    Single kernel thread mode enabled.\n"
"    multiple  Multiple kernel thread mode enabled.\n"
"\n"
);
606