2 Palacios VNET interface
5 #include <linux/spinlock.h>
6 #include <linux/seq_file.h>
7 #include <linux/proc_fs.h>
8 #include <asm/uaccess.h>
9 #include <linux/inet.h>
10 #include <linux/kthread.h>
12 #include <linux/netdevice.h>
15 #include <linux/string.h>
16 #include <linux/preempt.h>
17 #include <linux/sched.h>
20 #include <palacios/vmm_vnet.h>
21 #include "palacios-vnet.h"
23 //#define DEBUG_VNET_BRIGE
/* UDP port that the bridge's server socket is bound to in init_vnet_serv(). */
25 #define VNET_UDP_PORT 9000
/* Host-side record for one VNET route: the core route description plus list linkage. */
27 struct palacios_vnet_route {
/* Route description passed by value to v3_vnet_add_route(). */
28 struct v3_vnet_route route;
/* Linkage on vnet_state.route_list. */
32 struct list_head node;
/* NOTE(review): these members are accessed below as link->sock_addr and link->node,
 * so they presumably belong to struct vnet_link - confirm against the full declaration. */
/* Remote endpoint address; filled in by create_link() and handed to udp_send(). */
41 struct sockaddr_in sock_addr;
/* Linkage on vnet_state.link_list. */
45 struct list_head node;
/* Global state of the host-side VNET bridge. */
48 struct palacios_vnet_state {
/* Heads of the route and link lists; inject_route() and create_link() add entries
 * while holding the state's spinlock. */
52 struct list_head route_list;
53 struct list_head link_list;
/* UDP server socket and the local address it is bound to (see init_vnet_serv()). */
55 struct socket * serv_sock;
56 struct sockaddr_in serv_addr;
58 /* The thread receiving packets from sockets. */
59 struct task_struct * serv_thread;
/* Packet counters; pkt_recv, pkt_drop and pkt_udp_send are bumped in bridge_send_pkt(),
 * pkt_udp_recv in vnet_server(). */
62 unsigned long pkt_sent, pkt_recv, pkt_drop, pkt_udp_recv, pkt_udp_send;
/* The single bridge state instance; zeroed and initialised by palacios_init_vnet(). */
66 static struct palacios_vnet_state vnet_state;
69 struct vnet_link * link_by_ip(uint32_t ip) {
70 struct vnet_link * link = NULL;
72 list_for_each_entry(link, &(vnet_state.link_list), node) {
74 if (link->dst_ip == ip) {
82 struct vnet_link * link_by_idx(int idx) {
83 struct vnet_link * link = NULL;
85 list_for_each_entry(link, &(vnet_state.link_list), node) {
87 if (link->link_idx == idx) {
94 struct palacios_vnet_route * route_by_idx(int idx) {
95 struct palacios_vnet_route * route = NULL;
97 list_for_each_entry(route, &(vnet_state.route_list), node) {
99 if (route->route_idx == idx) {
108 static int parse_mac_str(char * str, uint8_t * qual, uint8_t * mac) {
111 printk("Parsing MAC (%s)\n", str);
114 if(strnicmp("any", str, strlen(str)) == 0){
117 }else if(strnicmp("none", str, strlen(str)) == 0){
121 if (strstr(str, "-")) {
122 token = strsep(&str, "-");
124 if (strnicmp("not", token, strlen("not")) == 0) {
127 printk("Invalid MAC String token (%s)\n", token);
132 if (strstr(str, ":")) {
135 if(*qual == MAC_NOSET){
139 for (i = 0; i < 6; i++) {
140 token = strsep(&str, ":");
142 printk("Invalid MAC String token (%s)\n", token);
145 mac[i] = simple_strtol(token, &token, 16);
147 printk("MAC: %2x:%2x:%2x:%2x:%2x:%2x\n", mac[0], mac[1], mac[2], mac[3], mac[4], mac[5]);
150 printk("Invalid MAC String token (%s)\n", token);
160 static int str2mac(char * str, uint8_t * mac){
164 for (i = 0; i < ETH_ALEN; i++) {
165 hex = strsep(&str, ":");
167 printk("Invalid MAC String token (%s)\n", str);
170 mac[i] = simple_strtol(hex, &hex, 16);
178 * add src-MAC dst-MAC dst-TYPE [dst-ID] src-TYPE [src-ID]
180 * src-MAC = dst-MAC = not-MAC|any|none|MAC
181 * dst-TYPE = edge|interface
182 * src-TYPE = edge|interface|any
183 * dst-ID = src-ID = IP|MAC
184 * MAC=xx:xx:xx:xx:xx:xx
185 * IP = xxx.xxx.xxx.xxx
/*
 * Parse the argument part of a route "add" command into *route.
 * Fields are split on single spaces with strsep(), so str is modified in place.
 * The field order follows the grammar comment above:
 *   src-MAC dst-MAC dst-TYPE dst-ID src-TYPE [src-ID]
 * route_write() treats a return value of -1 as a parse failure.
 */
187 static int parse_route_str(char * str, struct v3_vnet_route * route) {
189 struct vnet_link *link = NULL;
/* Field 1: source MAC match rule. */
192 token = strsep(&str, " ");
/* NOTE(review): the result of parse_mac_str() is discarded here, so a malformed
 * MAC does not stop the parse - confirm whether that is intended. */
196 parse_mac_str(token, &(route->src_mac_qual), route->src_mac);
/* Field 2: destination MAC match rule (same caveat about the ignored result). */
199 token = strsep(&str, " ");
203 parse_mac_str(token, &(route->dst_mac_qual), route->dst_mac);
/* Field 3: destination link type, matched case-insensitively by prefix. */
206 token = strsep(&str, " ");
210 printk("dst type =(%s)\n", token);
212 if (strnicmp("interface", token, strlen("interface")) == 0) {
213 route->dst_type = LINK_INTERFACE;
214 } else if (strnicmp("edge", token, strlen("edge")) == 0) {
215 route->dst_type = LINK_EDGE;
217 printk("Invalid Destination Link Type (%s)\n", token);
/* Field 4: destination id - an IPv4 address for edge links, a MAC for interfaces. */
222 token = strsep(&str, " ");
226 printk("dst link ID=(%s)\n", token);
228 // Figure out link here
229 if (route->dst_type == LINK_EDGE) {
232 // Figure out Link Here
/* in4_pton() writes the parsed address into link_ip; anything but 1 is a parse failure. */
233 if (in4_pton(token, strlen(token), (uint8_t *)&(link_ip), '\0', NULL) != 1) {
234 printk("Invalid Dst IP address (%s)\n", token);
/* The edge destination is recorded as the index of the link with that address. */
238 link = link_by_ip(link_ip);
240 route->dst_id = link->link_idx;
242 printk("can not find dst link %s\n", token);
246 printk("link_ip = %d, link_id = %d\n", link_ip, link->link_idx);
247 } else if (route->dst_type == LINK_INTERFACE) {
248 uint8_t mac[ETH_ALEN];
250 if(str2mac(token, mac) == -1){
251 printk("wrong MAC format (%s)\n", token);
/* The interface destination is recorded as the device id found for that MAC. */
255 route->dst_id = v3_vnet_find_dev(mac);
256 if (route->dst_id == -1){
257 printk("can not find dst device %s\n", token);
261 printk("Unsupported dst link type\n");
/* Start from an invalid source type so an unrecognised token can be detected below. */
266 route->src_type = -1;
/* Field 5: source link type. */
269 token = strsep(&str, " ");
271 printk("SRC type = %s\n", token);
277 if (strnicmp("interface", token, strlen("interface")) == 0) {
278 route->src_type = LINK_INTERFACE;
279 } else if (strnicmp("edge", token, strlen("edge")) == 0) {
280 route->src_type = LINK_EDGE;
281 } else if (strnicmp("any", token, strlen("any")) == 0) {
282 route->src_type = LINK_ANY;
284 printk("Invalid Src link type (%s)\n", token);
/* Field 6 (src-ID) is read only for edge sources in the code visible here. */
289 if (route->src_type == LINK_ANY) {
291 } else if (route->src_type == LINK_EDGE) {
293 token = strsep(&str, " ");
299 // Figure out Link Here
300 if (in4_pton(token, strlen(token), (uint8_t *)&(src_ip), '\0', NULL) != 1) {
301 printk("Invalid SRC IP address (%s)\n", token);
305 link = link_by_ip(src_ip);
307 route->src_id = link->link_idx;
309 printk("can not find src link %s\n", token);
312 } else if(route->src_type == LINK_INTERFACE){
313 uint8_t mac[ETH_ALEN];
/* NOTE(review): no strsep() is visible between reading the src-type token and this
 * use of `token`; confirm the src-ID field is actually fetched before it is parsed
 * as a MAC, otherwise the type keyword itself is being parsed. */
315 if(str2mac(token, mac) == -1){
316 printk("wrong MAC format (%s)\n", token);
320 route->src_id = v3_vnet_find_dev(mac);
321 if (route->src_id == -1){
/* NOTE(review): this is the source branch but the message says "dst device" -
 * looks like a copy/paste slip. */
322 printk("can not find dst device %s\n", token);
326 printk("Invalid link type\n");
/* seq_file .start callback for the routes listing (see route_seq_ops). */
336 static void * route_seq_start(struct seq_file * s, loff_t * pos) {
337 struct palacios_vnet_route * route_iter = NULL;
/* A position at or beyond the number of routes is past the end of the listing. */
341 if (*pos >= vnet_state.num_routes) {
/* Walk the route list; NOTE(review): presumably stops at the *pos-th entry - confirm. */
345 list_for_each_entry(route_iter, &(vnet_state.route_list), node) {
/* seq_file .start callback for the links listing (see link_seq_ops). */
358 static void * link_seq_start(struct seq_file * s, loff_t * pos) {
359 struct vnet_link * link_iter = NULL;
/* A position at or beyond the number of links is past the end of the listing. */
362 if (*pos >= vnet_state.num_links) {
/* Walk the link list; NOTE(review): presumably stops at the *pos-th entry - confirm. */
366 list_for_each_entry(link_iter, &(vnet_state.link_list), node) {
/* seq_file .next callback for the routes listing: step from entry v to its list successor. */
380 static void * route_seq_next(struct seq_file * s, void * v, loff_t * pos) {
381 struct palacios_vnet_route * route_iter = NULL;
/* Recover the record that embeds the list node following v's node. */
383 route_iter = list_entry(((struct palacios_vnet_route *)v)->node.next, struct palacios_vnet_route, node);
385 // Check if the list has looped
/* Arriving back at the list head means v was the last route. */
386 if (&(route_iter->node) == &(vnet_state.route_list)) {
/* seq_file .next callback for the links listing: step from entry v to its list successor. */
396 static void * link_seq_next(struct seq_file * s, void * v, loff_t * pos) {
397 struct vnet_link * link_iter = NULL;
/* Recover the link that embeds the list node following v's node. */
400 link_iter = list_entry(((struct vnet_link *)v)->node.next, struct vnet_link, node);
402 // Check if the list has looped
/* Arriving back at the list head means v was the last link. */
403 if (&(link_iter->node) == &(vnet_state.link_list)) {
/* seq_file .stop callback for the routes listing; logs that it was called. */
413 static void route_seq_stop(struct seq_file * s, void * v) {
414 printk("route_seq_stop\n");
/* seq_file .stop callback for the links listing; logs that it was called. */
420 static void link_seq_stop(struct seq_file * s, void * v) {
421 printk("link_seq_stop\n");
426 static int route_seq_show(struct seq_file * s, void * v) {
427 struct palacios_vnet_route * route_iter = v;
428 struct v3_vnet_route * route = &(route_iter->route);
430 seq_printf(s, "%d:\t", route_iter->route_idx);
432 seq_printf(s, "\nSrc:\t");
433 switch (route->src_mac_qual) {
435 seq_printf(s, "any ");
438 seq_printf(s, "none ");
441 seq_printf(s, "not-%2x:%2x:%2x:%2x:%2x:%2x ",
442 route->src_mac[0], route->src_mac[1], route->src_mac[2],
443 route->src_mac[3], route->src_mac[4], route->src_mac[5]);
446 seq_printf(s, "%x:%x:%x:%x:%x:%x ",
447 route->src_mac[0], route->src_mac[1], route->src_mac[2],
448 route->src_mac[3], route->src_mac[4], route->src_mac[5]);
452 seq_printf(s, "\nDst:\t");
453 switch (route->dst_mac_qual) {
455 seq_printf(s, "any ");
458 seq_printf(s, "none ");
461 seq_printf(s, "not-%x:%x:%x:%x:%x:%x ",
462 route->src_mac[0], route->src_mac[1], route->src_mac[2],
463 route->src_mac[3], route->src_mac[4], route->src_mac[5]);
466 seq_printf(s, "%x:%x:%x:%x:%x:%x ",
467 route->src_mac[0], route->src_mac[1], route->src_mac[2],
468 route->src_mac[3], route->src_mac[4], route->src_mac[5]);
472 seq_printf(s, "\nDst-Type:\t");
473 switch (route->dst_type) {
475 struct vnet_link * link = (struct vnet_link *)link_by_idx(route->dst_id);
476 seq_printf(s, "EDGE %pI4", &link->dst_ip);
479 case LINK_INTERFACE: {
480 seq_printf(s, "INTERFACE ");
481 seq_printf(s, "%d ", route->dst_id);
485 seq_printf(s, "Invalid Dst Link Type (%d) ", route->dst_type);
489 seq_printf(s, "\nSrc-Type:\t");
490 switch (route->src_type) {
492 struct vnet_link * link = (struct vnet_link *)link_by_idx(route->src_id);
493 seq_printf(s, "EDGE %pI4", &link->dst_ip);
496 case LINK_INTERFACE: {
497 seq_printf(s, "INTERFACE %d", route->src_id);
501 seq_printf(s, "ANY");
504 seq_printf(s, "Invalid Src Link Type (%d) ", route->src_type);
515 static int link_seq_show(struct seq_file * s, void * v) {
516 struct vnet_link * link_iter = v;
518 seq_printf(s, "%d:\t%pI4\t%d\n",
521 link_iter->dst_port);
527 static struct seq_operations route_seq_ops = {
528 .start = route_seq_start,
529 .next = route_seq_next,
530 .stop = route_seq_stop,
531 .show = route_seq_show
535 static struct seq_operations link_seq_ops = {
536 .start = link_seq_start,
537 .next = link_seq_next,
538 .stop = link_seq_stop,
539 .show = link_seq_show
543 static int route_open(struct inode * inode, struct file * file) {
544 return seq_open(file, &route_seq_ops);
548 static int link_open(struct inode * inode, struct file * file) {
549 return seq_open(file, &link_seq_ops);
552 static int inject_route(struct palacios_vnet_route * route) {
555 v3_vnet_add_route(route->route);
557 spin_lock_irqsave(&(vnet_state.lock), flags);
558 list_add(&(route->node), &(vnet_state.route_list));
559 route->route_idx = vnet_state.num_routes++;
560 spin_unlock_irqrestore(&(vnet_state.lock), flags);
562 printk("Palacios-vnet: One route added to VNET core\n");
/*
 * Write handler for the routes file (installed as route_fops.write).
 * Copies the user buffer into route_buf, splits it into lines on CR/LF and
 * dispatches on the first space-separated word of each line:
 *   ADD ... - allocate a route record, parse the rest of the line, inject it
 *   DEL ... - recognised but only logged
 * Keywords are matched case-insensitively by prefix.
 */
568 route_write(struct file * file,
573 char * buf_iter = NULL;
574 char * line_str = route_buf;
/* NOTE(review): route_buf is printed with %s and scanned by strsep() right after
 * this copy; confirm that size is bounded by the buffer length and that the
 * buffer is NUL-terminated after the user data. */
581 if (copy_from_user(route_buf, buf, size)) {
585 printk("Route written: %s\n", route_buf);
/* One command per line. */
587 while ((buf_iter = strsep(&line_str, "\r\n"))) {
/* First word selects the command; buf_iter is left pointing at its arguments. */
589 token = strsep(&buf_iter, " ");
594 if (strnicmp("ADD", token, strlen("ADD")) == 0) {
595 struct palacios_vnet_route * new_route = NULL;
596 new_route = kmalloc(sizeof(struct palacios_vnet_route), GFP_KERNEL);
602 memset(new_route, 0, sizeof(struct palacios_vnet_route));
/* parse_route_str() reports failure as -1. */
604 if (parse_route_str(buf_iter, &(new_route->route)) == -1) {
/* NOTE(review): the visible inject_route() code always returns 0, so this branch
 * looks unreachable at present. */
609 if (inject_route(new_route) != 0) {
612 } else if (strnicmp("DEL", token, strlen("DEL")) == 0) {
613 printk("I should delete the route here\n");
615 printk("Invalid Route command string\n");
623 static int create_link(struct vnet_link * link) {
627 if ( (err = sock_create(AF_INET, SOCK_DGRAM, IPPROTO_UDP, &link->sock)) < 0) {
628 printk("Could not create socket\n");
632 memset(&link->sock_addr, 0, sizeof(struct sockaddr));
634 link->sock_addr.sin_family = AF_INET;
635 link->sock_addr.sin_addr.s_addr = link->dst_ip;
636 link->sock_addr.sin_port = htons(link->dst_port);
638 if ((err = link->sock->ops->connect(link->sock, (struct sockaddr *)&(link->sock_addr), sizeof(struct sockaddr), 0) < 0)) {
639 printk("Could not connect to remote host\n");
643 // We use the file pointer because we are in the kernel
644 // This is only used to assigned File Descriptors for user space, so it is available here
645 // link->sock->file = link;
647 spin_lock_irqsave(&(vnet_state.lock), flags);
648 list_add(&(link->node), &(vnet_state.link_list));
649 link->link_idx = vnet_state.num_links++;
650 spin_unlock_irqrestore(&(vnet_state.lock), flags);
652 printk("VNET Bridge: Link created, ip %d, port: %d, idx: %d, link: %p\n",
662 /* ADD dst-ip 9000 */
/*
 * Write handler for the links file.
 * Copies the user buffer into link_buf, splits it into lines on CR/LF and
 * dispatches on the first space-separated word of each line:
 *   ADD <dst-ip> <port> - allocate a link record and bring the link up
 *   DEL ...             - recognised but not supported
 * Keywords are matched case-insensitively by prefix.
 */
664 link_write(struct file * file, const char * buf, size_t size, loff_t * ppos) {
666 char * link_iter = NULL;
667 char * line_str = link_buf;
/* NOTE(review): link_buf is printed with %s and scanned by strsep() after this copy;
 * confirm that size is bounded by the buffer length and that the buffer is
 * NUL-terminated after the user data. */
674 if (copy_from_user(link_buf, buf, size)) {
/* One command per line. */
678 while ((link_iter = strsep(&line_str, "\r\n"))) {
/* NOTE(review): this logs the whole buffer on every iteration, not the current line. */
679 printk("Link written: %s\n", link_buf);
/* First word selects the command; link_iter is left pointing at its arguments. */
681 token = strsep(&link_iter, " ");
687 if (strnicmp("ADD", token, strlen("ADD")) == 0) {
688 struct vnet_link * new_link = NULL;
689 char * ip_str = NULL;
/* Second word is the destination IP; what remains in link_iter is the port text. */
692 ip_str = strsep(&link_iter, " ");
694 if ((!ip_str) || (!link_iter)) {
695 printk("Missing fields in ADD Link command\n");
/* in4_pton() writes the parsed address into ip; anything but 1 is a parse failure. */
699 if (in4_pton(ip_str, strlen(ip_str), (uint8_t *)&(ip), '\0', NULL) != 1) {
700 printk("Invalid Dst IP address (%s)\n", ip_str);
704 new_link = kmalloc(sizeof(struct vnet_link), GFP_KERNEL);
710 memset(new_link, 0, sizeof(struct vnet_link));
712 new_link->dst_ip = ip;
/* The port is parsed as decimal; NOTE(review): no range or trailing-text check is visible. */
713 new_link->dst_port = simple_strtol(link_iter, &link_iter, 10);
715 if (create_link(new_link) != 0) {
716 printk("Could not create link\n");
721 } else if (strnicmp("DEL", token, strlen("DEL")) == 0) {
722 printk("Link deletion not supported\n");
724 printk("Invalid Link command string\n");
/* File operations for the routes file; attached to its proc entry in init_proc_files(). */
732 static struct file_operations route_fops = {
733 .owner = THIS_MODULE,
/* Writes carry ADD/DEL route commands. */
736 .write = route_write,
738 .release = seq_release
/* File operations for the links file; attached to its proc entry in init_proc_files(). */
742 static struct file_operations link_fops = {
743 .owner = THIS_MODULE,
748 .release = seq_release
752 static int init_proc_files(void) {
753 struct proc_dir_entry * route_entry = NULL;
754 struct proc_dir_entry * link_entry = NULL;
755 struct proc_dir_entry * vnet_root = NULL;
758 vnet_root = proc_mkdir("vnet", NULL);
759 if (vnet_root == NULL) {
763 route_entry = create_proc_entry("routes", 0, vnet_root);
765 if (route_entry == NULL) {
766 remove_proc_entry("vnet", NULL);
770 route_entry->proc_fops = &route_fops;
773 link_entry = create_proc_entry("links", 0, vnet_root);
775 if (link_entry == NULL) {
776 remove_proc_entry("routes", vnet_root);
777 remove_proc_entry("vnet", NULL);
781 link_entry->proc_fops = &link_fops;
/*
 * Send len bytes from buf over sock with sock_sendmsg().
 * NOTE(review): addr is presumably installed as the message destination - confirm.
 */
790 udp_send(struct socket * sock,
791 struct sockaddr_in * addr,
792 unsigned char * buf, int len) {
/* A socket without an attached sk cannot be used. */
799 if (sock->sk == NULL) {
/* No ancillary (control) data accompanies the datagram. */
808 msg.msg_namelen = sizeof(struct sockaddr_in);
809 msg.msg_control = NULL;
810 msg.msg_controllen = 0;
/* NOTE(review): msg_control is set to NULL a second time here; looks redundant. */
813 msg.msg_control = NULL;
817 size = sock_sendmsg(sock, &msg, len);
/*
 * Receive up to len bytes into buf from sock with sock_recvmsg().
 * NOTE(review): addr presumably receives the sender's address - confirm.
 */
826 udp_recv(struct socket * sock,
827 struct sockaddr_in * addr,
828 unsigned char * buf, int len) {
/* A socket without an attached sk cannot be used. */
834 if (sock->sk == NULL) {
/* No ancillary (control) data is requested. */
843 msg.msg_namelen = sizeof(struct sockaddr_in);
844 msg.msg_control = NULL;
845 msg.msg_controllen = 0;
/* NOTE(review): msg_control is set to NULL a second time here; looks redundant. */
848 msg.msg_control = NULL;
852 size = sock_recvmsg(sock, &msg, len, msg.msg_flags);
859 //send packets from Network to VNET core
/*
 * Wrap a frame received from the network in a v3_vnet_pkt, tagged as coming
 * from edge link link_id, and pass it to the VNET core via v3_vnet_send_pkt().
 * Returns whatever v3_vnet_send_pkt() returns.
 */
861 send_to_palacios(unsigned char * buf,
864 struct v3_vnet_pkt pkt;
866 pkt.src_type = LINK_EDGE;
867 pkt.src_id = link_id;
/* Copy the Ethernet header out of the frame.
 * NOTE(review): no check that the frame is at least ETHERNET_HEADER_LEN bytes is visible. */
868 memcpy(pkt.header, buf, ETHERNET_HEADER_LEN);
/* Optional trace of the packet when VNET debugging is configured. */
871 #ifdef CONFIG_PALACIOS_VNET_DEBUG
873 printk("VNET Lnx Bridge: send pkt to VNET core (size: %d, src_id: %d, src_type: %d)\n",
874 pkt.size, pkt.src_id, pkt.src_type);
876 print_hex_dump(NULL, "pkt_data: ", 0, 20, 20, pkt.data, pkt.size, 0);
880 return v3_vnet_send_pkt(&pkt, NULL);;
884 //send packet from VNET core to Network
/*
 * Bridge input callback (registered as bridge_ops.input): forward a packet
 * from the VNET core to the network over the edge link named by pkt->dst_id.
 */
886 bridge_send_pkt(struct v3_vm_info * vm,
887 struct v3_vnet_pkt * pkt,
888 void * private_data) {
889 struct vnet_link * link;
/* Optional trace of the packet when VNET debugging is configured. */
891 #ifdef CONFIG_PALACIOS_VNET_DEBUG
893 printk("VNET Lnx Host Bridge: packet received from VNET Core ... len: %d, pkt size: %d, link: %d\n",
898 print_hex_dump(NULL, "pkt_data: ", 0, 20, 20, pkt->data, pkt->size, 0);
/* Every packet handed over by the core is counted as received. */
902 vnet_state.pkt_recv ++;
/* The destination id of an outbound packet is a link index. */
904 link = link_by_idx(pkt->dst_id);
/* NOTE(review): the result of udp_send() is not examined; the send counter is
 * bumped regardless. */
906 udp_send(link->sock, &(link->sock_addr), pkt->data, pkt->size);
907 vnet_state.pkt_udp_send ++;
/* Unknown link index: log it and count the packet as dropped. */
909 printk("VNET Bridge Linux Host: wrong dst link, idx: %d, discards the packet\n", pkt->dst_id);
910 vnet_state.pkt_drop ++;
/* Bridge poll callback; registered as bridge_ops.poll in palacios_init_vnet(). */
918 poll_pkt(struct v3_vm_info * vm,
919 void * private_data) {
926 static int init_vnet_serv(void) {
928 if (sock_create(AF_INET, SOCK_DGRAM, IPPROTO_UDP, &vnet_state.serv_sock) < 0) {
929 printk("Could not create socket\n");
933 memset(&vnet_state.serv_addr, 0, sizeof(struct sockaddr));
935 vnet_state.serv_addr.sin_family = AF_INET;
936 vnet_state.serv_addr.sin_addr.s_addr = htonl(INADDR_ANY);
937 vnet_state.serv_addr.sin_port = htons(VNET_UDP_PORT);
939 if (vnet_state.serv_sock->ops->bind(vnet_state.serv_sock, (struct sockaddr *)&(vnet_state.serv_addr), sizeof(struct sockaddr)) < 0) {
940 printk("Could not bind VNET server socket to port %d\n", VNET_UDP_PORT);
944 printk("VNET server bind to port: %d\n", VNET_UDP_PORT);
949 static int vnet_server(void * arg) {
950 unsigned char pkt[ETHERNET_PACKET_LEN];
951 struct sockaddr_in pkt_addr;
952 struct vnet_link *link = NULL;
956 printk("Palacios VNET Bridge: UDP receiving server ..... \n");
958 while (!kthread_should_stop()) {
960 len = udp_recv(vnet_state.serv_sock, &pkt_addr, pkt, ETHERNET_PACKET_LEN);
962 printk("Receive error: Could not get packet, error %d\n", len);
966 link = link_by_ip(ntohl(pkt_addr.sin_addr.s_addr));
968 link_id= link->link_idx;
974 vnet_state.pkt_udp_recv ++;
976 send_to_palacios(pkt, len, link_id);
/*
 * Initialise the host-side VNET bridge: reset the global state, bring up the
 * UDP server socket, start the receiving thread and register the bridge
 * callbacks with the VNET core.
 */
983 int palacios_init_vnet(void) {
984 struct v3_vnet_bridge_ops bridge_ops;
/* Start from a clean state, then set up the list heads and the lock. */
986 memset(&vnet_state, 0, sizeof(struct palacios_vnet_state));
988 INIT_LIST_HEAD(&(vnet_state.link_list));
989 INIT_LIST_HEAD(&(vnet_state.route_list));
990 spin_lock_init(&(vnet_state.lock));
/* init_vnet_serv() reports failure with a negative value. */
993 if(init_vnet_serv() < 0){
994 printk("Failure to initiate VNET server\n");
/* NOTE(review): the kthread_run() result is stored without any error check visible here. */
998 vnet_state.serv_thread = kthread_run(vnet_server, NULL, "vnet-server");
1000 //kthread_run(profiling, NULL, "Profiling");
/* NOTE(review): bridge_ops lives on this function's stack and only these two members
 * are assigned; confirm that v3_vnet_add_bridge() copies the structure rather than
 * keeping the pointer, and that no other member is read. */
1002 bridge_ops.input = bridge_send_pkt;
1003 bridge_ops.poll = poll_pkt;
1005 v3_vnet_add_bridge(NULL, &bridge_ops, HOST_LNX_BRIDGE, NULL);
1007 printk("Palacios VNET Linux Bridge initiated\n");