/* A simple network driver using virtio.
 *
 * Copyright 2007 Rusty Russell <rusty@rustcorp.com.au> IBM Corporation
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
//#define DEBUG
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/ethtool.h>
#include <linux/module.h>
#include <linux/virtio.h>
#include <linux/virtio_net.h>
#include <linux/scatterlist.h>
#include <linux/if_vlan.h>

static int napi_weight = 128;
module_param(napi_weight, int, 0444);

static int csum = 1, gso = 1;
module_param(csum, bool, 0444);
module_param(gso, bool, 0444);

/* FIXME: MTU in config. */
#define MAX_PACKET_LEN (ETH_HLEN + VLAN_HLEN + ETH_DATA_LEN)
#define GOOD_COPY_LEN	128

struct virtnet_info {
	struct virtio_device *vdev;
	struct virtqueue *rvq, *svq;
	struct net_device *dev;
	struct napi_struct napi;

	/* The skb we couldn't send because buffers were full. */
	struct sk_buff *last_xmit_skb;

	/* If we need to free in a timer, this is it. */
	struct timer_list xmit_free_timer;

	/* Number of input buffers, and max we've ever had. */
	unsigned int num, max;

	/* For cleaning up after transmission. */
	struct tasklet_struct tasklet;
	bool free_in_tasklet;

	/* I like... big packets and I cannot lie! */
	bool big_packets;

	/* Host will merge rx buffers for big packets (shake it! shake it!) */
	bool mergeable_rx_bufs;

	/* Receive & send queues. */
	struct sk_buff_head recv;
	struct sk_buff_head send;

	/* Chain pages by the private ptr. */
	struct page *pages;
};

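/* The virtio_net header for an skb is stashed in its control buffer
 * (skb->cb), which is ours to use while the skb sits on our queues. */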
static inline void *skb_vnet_hdr(struct sk_buff *skb)
{
	return (struct virtio_net_hdr *)skb->cb;
}

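/* Return a page to our private free list (chained via page->private). */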
static void give_a_page(struct virtnet_info *vi, struct page *page)
{
	page->private = (unsigned long)vi->pages;
	vi->pages = page;
}

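/* Give back the skb's fragment pages and drop its paged data, leaving
 * only the linear part. */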
static void trim_pages(struct virtnet_info *vi, struct sk_buff *skb)
{
	unsigned int i;

	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++)
		give_a_page(vi, skb_shinfo(skb)->frags[i].page);
	skb_shinfo(skb)->nr_frags = 0;
	skb->data_len = 0;
}

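/* Grab a page from our free list, falling back to a fresh allocation
 * when the list is empty. */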
static struct page *get_a_page(struct virtnet_info *vi, gfp_t gfp_mask)
{
	struct page *p = vi->pages;

	if (p)
		vi->pages = (struct page *)p->private;
	else
		p = alloc_page(gfp_mask);
	return p;
}

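/* Virtqueue callback: the host has consumed some output buffers.  Wake
 * the queue and let the tasklet retry any deferred skb. */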
static void skb_xmit_done(struct virtqueue *svq)
{
	struct virtnet_info *vi = svq->vdev->priv;

	/* Suppress further interrupts. */
	svq->vq_ops->disable_cb(svq);

	/* We were probably waiting for more output buffers. */
	netif_wake_queue(vi->dev);

	/* Make sure we re-xmit last_xmit_skb: if there are no more packets
	 * queued, start_xmit won't be called. */
	tasklet_schedule(&vi->tasklet);
}

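/* Process one received skb: parse the virtio_net header (gathering the
 * packet's remaining buffers if the host merged rx buffers), then apply
 * the checksum and GSO hints before handing the skb up the stack. */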
static void receive_skb(struct net_device *dev, struct sk_buff *skb,
			unsigned len)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct virtio_net_hdr *hdr = skb_vnet_hdr(skb);
	int err;
	int i;

	if (unlikely(len < sizeof(struct virtio_net_hdr) + ETH_HLEN)) {
		pr_debug("%s: short packet %i\n", dev->name, len);
		dev->stats.rx_length_errors++;
		goto drop;
	}

	if (vi->mergeable_rx_bufs) {
		struct virtio_net_hdr_mrg_rxbuf *mhdr = skb_vnet_hdr(skb);
		unsigned int copy;
		char *p = page_address(skb_shinfo(skb)->frags[0].page);

		if (len > PAGE_SIZE)
			len = PAGE_SIZE;
		len -= sizeof(struct virtio_net_hdr_mrg_rxbuf);

		memcpy(hdr, p, sizeof(*mhdr));
		p += sizeof(*mhdr);

		copy = len;
		if (copy > skb_tailroom(skb))
			copy = skb_tailroom(skb);

		memcpy(skb_put(skb, copy), p, copy);

		len -= copy;

		if (!len) {
			give_a_page(vi, skb_shinfo(skb)->frags[0].page);
			skb_shinfo(skb)->nr_frags--;
		} else {
			skb_shinfo(skb)->frags[0].page_offset +=
				sizeof(*mhdr) + copy;
			skb_shinfo(skb)->frags[0].size = len;
			skb->data_len += len;
			skb->len += len;
		}

		while (--mhdr->num_buffers) {
			struct sk_buff *nskb;

			i = skb_shinfo(skb)->nr_frags;
			if (i >= MAX_SKB_FRAGS) {
				pr_debug("%s: packet too long %d\n", dev->name,
					 len);
				dev->stats.rx_length_errors++;
				goto drop;
			}

			nskb = vi->rvq->vq_ops->get_buf(vi->rvq, &len);
			if (!nskb) {
				pr_debug("%s: rx error: %d buffers missing\n",
					 dev->name, mhdr->num_buffers);
				dev->stats.rx_length_errors++;
				goto drop;
			}

			__skb_unlink(nskb, &vi->recv);
			vi->num--;

			skb_shinfo(skb)->frags[i] = skb_shinfo(nskb)->frags[0];
			skb_shinfo(nskb)->nr_frags = 0;
			kfree_skb(nskb);

			if (len > PAGE_SIZE)
				len = PAGE_SIZE;

			skb_shinfo(skb)->frags[i].size = len;
			skb_shinfo(skb)->nr_frags++;
			skb->data_len += len;
			skb->len += len;
		}
	} else {
		len -= sizeof(struct virtio_net_hdr);

		if (len <= MAX_PACKET_LEN)
			trim_pages(vi, skb);

		err = pskb_trim(skb, len);
		if (err) {
			pr_debug("%s: pskb_trim failed %i %d\n", dev->name,
				 len, err);
			dev->stats.rx_dropped++;
			goto drop;
		}
	}

	skb->truesize += skb->data_len;
	dev->stats.rx_bytes += skb->len;
	dev->stats.rx_packets++;

	if (hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) {
		pr_debug("Needs csum!\n");
		if (!skb_partial_csum_set(skb, hdr->csum_start,
					  hdr->csum_offset))
			goto frame_err;
	}

	skb->protocol = eth_type_trans(skb, dev);
	pr_debug("Receiving skb proto 0x%04x len %i type %i\n",
		 ntohs(skb->protocol), skb->len, skb->pkt_type);

	if (hdr->gso_type != VIRTIO_NET_HDR_GSO_NONE) {
		pr_debug("GSO!\n");
		switch (hdr->gso_type & ~VIRTIO_NET_HDR_GSO_ECN) {
		case VIRTIO_NET_HDR_GSO_TCPV4:
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
			break;
		case VIRTIO_NET_HDR_GSO_UDP:
			skb_shinfo(skb)->gso_type = SKB_GSO_UDP;
			break;
		case VIRTIO_NET_HDR_GSO_TCPV6:
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
			break;
		default:
			if (net_ratelimit())
				printk(KERN_WARNING "%s: bad gso type %u.\n",
				       dev->name, hdr->gso_type);
			goto frame_err;
		}

		if (hdr->gso_type & VIRTIO_NET_HDR_GSO_ECN)
			skb_shinfo(skb)->gso_type |= SKB_GSO_TCP_ECN;

		skb_shinfo(skb)->gso_size = hdr->gso_size;
		if (skb_shinfo(skb)->gso_size == 0) {
			if (net_ratelimit())
				printk(KERN_WARNING "%s: zero gso size.\n",
				       dev->name);
			goto frame_err;
		}

		/* Header must be checked, and gso_segs computed. */
		skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
		skb_shinfo(skb)->gso_segs = 0;
	}

	netif_receive_skb(skb);
	return;

frame_err:
	dev->stats.rx_frame_errors++;
drop:
	dev_kfree_skb(skb);
}

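/* Fill the receive ring with worst-case skbs: a header plus the linear
 * area, plus MAX_SKB_FRAGS pages when the host may send big (GSO)
 * packets. */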
static void try_fill_recv_maxbufs(struct virtnet_info *vi)
{
	struct sk_buff *skb;
	struct scatterlist sg[2+MAX_SKB_FRAGS];
	int num, err, i;

	sg_init_table(sg, 2+MAX_SKB_FRAGS);
	for (;;) {
		struct virtio_net_hdr *hdr;

		skb = netdev_alloc_skb(vi->dev, MAX_PACKET_LEN);
		if (unlikely(!skb))
			break;

		skb_put(skb, MAX_PACKET_LEN);

		hdr = skb_vnet_hdr(skb);
		sg_set_buf(sg, hdr, sizeof(*hdr));

		if (vi->big_packets) {
			for (i = 0; i < MAX_SKB_FRAGS; i++) {
				skb_frag_t *f = &skb_shinfo(skb)->frags[i];
				f->page = get_a_page(vi, GFP_ATOMIC);
				if (!f->page)
					break;

				f->page_offset = 0;
				f->size = PAGE_SIZE;

				skb->data_len += PAGE_SIZE;
				skb->len += PAGE_SIZE;

				skb_shinfo(skb)->nr_frags++;
			}
		}

		num = skb_to_sgvec(skb, sg+1, 0, skb->len) + 1;
		skb_queue_head(&vi->recv, skb);

		err = vi->rvq->vq_ops->add_buf(vi->rvq, sg, 0, num, skb);
		if (err) {
			skb_unlink(skb, &vi->recv);
			trim_pages(vi, skb);
			kfree_skb(skb);
			break;
		}
		vi->num++;
	}
	if (unlikely(vi->num > vi->max))
		vi->max = vi->num;
	vi->rvq->vq_ops->kick(vi->rvq);
}

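/* Fill the receive ring.  With mergeable rx buffers each entry is a
 * small skb backed by a single page; otherwise we need the worst-case
 * buffers above. */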
static void try_fill_recv(struct virtnet_info *vi)
{
	struct sk_buff *skb;
	struct scatterlist sg[1];
	int err;

	if (!vi->mergeable_rx_bufs) {
		try_fill_recv_maxbufs(vi);
		return;
	}

	for (;;) {
		skb_frag_t *f;

		skb = netdev_alloc_skb(vi->dev, GOOD_COPY_LEN + NET_IP_ALIGN);
		if (unlikely(!skb))
			break;

		skb_reserve(skb, NET_IP_ALIGN);

		f = &skb_shinfo(skb)->frags[0];
		f->page = get_a_page(vi, GFP_ATOMIC);
		if (!f->page) {
			kfree_skb(skb);
			break;
		}

		f->page_offset = 0;
		f->size = PAGE_SIZE;

		skb_shinfo(skb)->nr_frags++;

		sg_init_one(sg, page_address(f->page), PAGE_SIZE);
		skb_queue_head(&vi->recv, skb);

		err = vi->rvq->vq_ops->add_buf(vi->rvq, sg, 0, 1, skb);
		if (err) {
			skb_unlink(skb, &vi->recv);
			kfree_skb(skb);
			break;
		}
		vi->num++;
	}
	if (unlikely(vi->num > vi->max))
		vi->max = vi->num;
	vi->rvq->vq_ops->kick(vi->rvq);
}

static void skb_recv_done(struct virtqueue *rvq)
{
	struct virtnet_info *vi = rvq->vdev->priv;
	/* Schedule NAPI; suppress further interrupts if successful. */
	if (netif_rx_schedule_prep(&vi->napi)) {
		rvq->vq_ops->disable_cb(rvq);
		__netif_rx_schedule(&vi->napi);
	}
}

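/* NAPI poll: hand received packets to the stack, top up the ring once it
 * drops below half full, and re-enable interrupts when we go idle
 * (rechecking in case a packet raced with enable_cb). */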
static int virtnet_poll(struct napi_struct *napi, int budget)
{
	struct virtnet_info *vi = container_of(napi, struct virtnet_info, napi);
	struct sk_buff *skb = NULL;
	unsigned int len, received = 0;

again:
	while (received < budget &&
	       (skb = vi->rvq->vq_ops->get_buf(vi->rvq, &len)) != NULL) {
		__skb_unlink(skb, &vi->recv);
		receive_skb(vi->dev, skb, len);
		vi->num--;
		received++;
	}

	/* FIXME: If we oom and completely run out of inbufs, we need
	 * to start a timer trying to fill more. */
	if (vi->num < vi->max / 2)
		try_fill_recv(vi);

	/* Out of packets? */
	if (received < budget) {
		netif_rx_complete(napi);
		if (unlikely(!vi->rvq->vq_ops->enable_cb(vi->rvq))
		    && napi_schedule_prep(napi)) {
			vi->rvq->vq_ops->disable_cb(vi->rvq);
			__netif_rx_schedule(napi);
			goto again;
		}
	}

	return received;
}

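/* Reclaim and free skbs the host has finished transmitting, updating
 * the tx statistics as we go. */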
static void free_old_xmit_skbs(struct virtnet_info *vi)
{
	struct sk_buff *skb;
	unsigned int len;

	while ((skb = vi->svq->vq_ops->get_buf(vi->svq, &len)) != NULL) {
		pr_debug("Sent skb %p\n", skb);
		__skb_unlink(skb, &vi->send);
		vi->dev->stats.tx_bytes += skb->len;
		vi->dev->stats.tx_packets++;
		kfree_skb(skb);
	}
}

/* If the virtio transport doesn't always notify us when all in-flight packets
 * are consumed, we fall back to using this function on a timer to free them. */
static void xmit_free(unsigned long data)
{
	struct virtnet_info *vi = (void *)data;

	netif_tx_lock(vi->dev);

	free_old_xmit_skbs(vi);

	if (!skb_queue_empty(&vi->send))
		mod_timer(&vi->xmit_free_timer, jiffies + (HZ/10));

	netif_tx_unlock(vi->dev);
}

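/* Fill in the virtio_net header from the skb's checksum/GSO state and
 * add header + payload to the send queue as one scatterlist.  Returns
 * nonzero if the queue had no room; arms the fallback free timer when
 * the transport won't notify us itself. */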
static int xmit_skb(struct virtnet_info *vi, struct sk_buff *skb)
{
	int num, err;
	struct scatterlist sg[2+MAX_SKB_FRAGS];
	struct virtio_net_hdr_mrg_rxbuf *mhdr = skb_vnet_hdr(skb);
	struct virtio_net_hdr *hdr = skb_vnet_hdr(skb);
	const unsigned char *dest = ((struct ethhdr *)skb->data)->h_dest;

	sg_init_table(sg, 2+MAX_SKB_FRAGS);

	pr_debug("%s: xmit %p %pM\n", vi->dev->name, skb, dest);

	if (skb->ip_summed == CHECKSUM_PARTIAL) {
		hdr->flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
		hdr->csum_start = skb->csum_start - skb_headroom(skb);
		hdr->csum_offset = skb->csum_offset;
	} else {
		hdr->flags = 0;
		hdr->csum_offset = hdr->csum_start = 0;
	}

	if (skb_is_gso(skb)) {
		hdr->hdr_len = skb_transport_header(skb) - skb->data;
		hdr->gso_size = skb_shinfo(skb)->gso_size;
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV4)
			hdr->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6)
			hdr->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_UDP)
			hdr->gso_type = VIRTIO_NET_HDR_GSO_UDP;
		else
			BUG();
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCP_ECN)
			hdr->gso_type |= VIRTIO_NET_HDR_GSO_ECN;
	} else {
		hdr->gso_type = VIRTIO_NET_HDR_GSO_NONE;
		hdr->gso_size = hdr->hdr_len = 0;
	}

	mhdr->num_buffers = 0;

	/* Encode metadata header at front. */
	if (vi->mergeable_rx_bufs)
		sg_set_buf(sg, mhdr, sizeof(*mhdr));
	else
		sg_set_buf(sg, hdr, sizeof(*hdr));

	num = skb_to_sgvec(skb, sg+1, 0, skb->len) + 1;

	err = vi->svq->vq_ops->add_buf(vi->svq, sg, num, 0, skb);
	if (!err && !vi->free_in_tasklet)
		mod_timer(&vi->xmit_free_timer, jiffies + (HZ/10));

	return err;
}

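/* Runs once the host has freed buffers: retry the deferred
 * last_xmit_skb, and do the skb reclaim here instead of in the timer
 * when the transport notifies on empty. */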
static void xmit_tasklet(unsigned long data)
{
	struct virtnet_info *vi = (void *)data;

	netif_tx_lock_bh(vi->dev);
	if (vi->last_xmit_skb && xmit_skb(vi, vi->last_xmit_skb) == 0) {
		vi->svq->vq_ops->kick(vi->svq);
		vi->last_xmit_skb = NULL;
	}
	if (vi->free_in_tasklet)
		free_old_xmit_skbs(vi);
	netif_tx_unlock_bh(vi->dev);
}

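/* Transmit entry point.  We keep back at most one skb (last_xmit_skb)
 * when the ring is full; if even that can't be sent, stop the queue
 * until skb_xmit_done wakes us. */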
static int start_xmit(struct sk_buff *skb, struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);

again:
	/* Free up any pending old buffers before queueing new ones. */
	free_old_xmit_skbs(vi);

	/* If we have a buffer left over from last time, send it now. */
	if (unlikely(vi->last_xmit_skb) &&
	    xmit_skb(vi, vi->last_xmit_skb) != 0)
		goto stop_queue;

	vi->last_xmit_skb = NULL;

	/* Put new one in send queue and do transmit */
	if (likely(skb)) {
		__skb_queue_head(&vi->send, skb);
		if (xmit_skb(vi, skb) != 0) {
			vi->last_xmit_skb = skb;
			skb = NULL;
			goto stop_queue;
		}
	}
done:
	vi->svq->vq_ops->kick(vi->svq);
	return NETDEV_TX_OK;

stop_queue:
	pr_debug("%s: virtio not prepared to send\n", dev->name);
	netif_stop_queue(dev);

	/* Activate callback for using skbs: if this returns false it
	 * means some were used in the meantime. */
	if (unlikely(!vi->svq->vq_ops->enable_cb(vi->svq))) {
		vi->svq->vq_ops->disable_cb(vi->svq);
		netif_start_queue(dev);
		goto again;
	}
	if (skb) {
		/* Drop this skb: we only queue one. */
		vi->dev->stats.tx_dropped++;
		kfree_skb(skb);
	}
	goto done;
}

#ifdef CONFIG_NET_POLL_CONTROLLER
static void virtnet_netpoll(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);

	napi_schedule(&vi->napi);
}
#endif

static int virtnet_open(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);

	napi_enable(&vi->napi);

	/* If all buffers were filled by the other side before we enabled
	 * NAPI, we won't get another interrupt, so process any outstanding
	 * packets now.  virtnet_poll wants to re-enable the queue, so we
	 * disable it here.  We synchronize against interrupts via
	 * NAPI_STATE_SCHED. */
	if (netif_rx_schedule_prep(&vi->napi)) {
		vi->rvq->vq_ops->disable_cb(vi->rvq);
		__netif_rx_schedule(&vi->napi);
	}
	return 0;
}

static int virtnet_close(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);

	napi_disable(&vi->napi);

	return 0;
}

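/* Ethtool hook: tx checksum offload can only be enabled if the host
 * accepts checksum-offloaded packets (VIRTIO_NET_F_CSUM). */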
static int virtnet_set_tx_csum(struct net_device *dev, u32 data)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct virtio_device *vdev = vi->vdev;

	if (data && !virtio_has_feature(vdev, VIRTIO_NET_F_CSUM))
		return -ENOSYS;

	return ethtool_op_set_tx_hw_csum(dev, data);
}

static struct ethtool_ops virtnet_ethtool_ops = {
	.set_tx_csum = virtnet_set_tx_csum,
	.set_sg = ethtool_op_set_sg,
	.set_tso = ethtool_op_set_tso,
};

#define MIN_MTU 68
#define MAX_MTU 65535

static int virtnet_change_mtu(struct net_device *dev, int new_mtu)
{
	if (new_mtu < MIN_MTU || new_mtu > MAX_MTU)
		return -EINVAL;
	dev->mtu = new_mtu;
	return 0;
}

static const struct net_device_ops virtnet_netdev = {
	.ndo_open            = virtnet_open,
	.ndo_stop            = virtnet_close,
	.ndo_start_xmit      = start_xmit,
	.ndo_validate_addr   = eth_validate_addr,
	.ndo_set_mac_address = eth_mac_addr,
	.ndo_change_mtu      = virtnet_change_mtu,
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller = virtnet_netpoll,
#endif
};

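/* Device probe: allocate the netdev, translate negotiated virtio
 * features into netdev features, find the receive and send virtqueues,
 * register with the stack, and prime the receive ring. */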
static int virtnet_probe(struct virtio_device *vdev)
{
	int err;
	struct net_device *dev;
	struct virtnet_info *vi;

	/* Allocate ourselves a network device with room for our info */
	dev = alloc_etherdev(sizeof(struct virtnet_info));
	if (!dev)
		return -ENOMEM;

	/* Set up network device as normal. */
	dev->netdev_ops = &virtnet_netdev;
	dev->features = NETIF_F_HIGHDMA;
	SET_ETHTOOL_OPS(dev, &virtnet_ethtool_ops);
	SET_NETDEV_DEV(dev, &vdev->dev);

	/* Do we support "hardware" checksums? */
	if (csum && virtio_has_feature(vdev, VIRTIO_NET_F_CSUM)) {
		/* This opens up the world of extra features. */
		dev->features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;
		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_GSO)) {
			dev->features |= NETIF_F_TSO | NETIF_F_UFO
				| NETIF_F_TSO_ECN | NETIF_F_TSO6;
		}
		/* Individual feature bits: what can host handle? */
		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO4))
			dev->features |= NETIF_F_TSO;
		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO6))
			dev->features |= NETIF_F_TSO6;
		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_ECN))
			dev->features |= NETIF_F_TSO_ECN;
		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_UFO))
			dev->features |= NETIF_F_UFO;
	}

	/* Configuration may specify what MAC to use.  Otherwise random. */
	if (virtio_has_feature(vdev, VIRTIO_NET_F_MAC)) {
		vdev->config->get(vdev,
				  offsetof(struct virtio_net_config, mac),
				  dev->dev_addr, dev->addr_len);
	} else
		random_ether_addr(dev->dev_addr);

	/* Set up our device-specific information */
	vi = netdev_priv(dev);
	netif_napi_add(dev, &vi->napi, virtnet_poll, napi_weight);
	vi->dev = dev;
	vi->vdev = vdev;
	vdev->priv = vi;
	vi->pages = NULL;

	/* If they give us a callback when all buffers are done, we don't need
	 * the timer. */
	vi->free_in_tasklet = virtio_has_feature(vdev, VIRTIO_F_NOTIFY_ON_EMPTY);

	/* If we can receive ANY GSO packets, we must allocate large ones. */
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO4)
	    || virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO6)
	    || virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_ECN))
		vi->big_packets = true;

	if (virtio_has_feature(vdev, VIRTIO_NET_F_MRG_RXBUF))
		vi->mergeable_rx_bufs = true;

	/* We expect two virtqueues, receive then send. */
	vi->rvq = vdev->config->find_vq(vdev, 0, skb_recv_done);
	if (IS_ERR(vi->rvq)) {
		err = PTR_ERR(vi->rvq);
		goto free;
	}

	vi->svq = vdev->config->find_vq(vdev, 1, skb_xmit_done);
	if (IS_ERR(vi->svq)) {
		err = PTR_ERR(vi->svq);
		goto free_recv;
	}

	/* Initialize our empty receive and send queues. */
	skb_queue_head_init(&vi->recv);
	skb_queue_head_init(&vi->send);

	tasklet_init(&vi->tasklet, xmit_tasklet, (unsigned long)vi);

	if (!vi->free_in_tasklet)
		setup_timer(&vi->xmit_free_timer, xmit_free, (unsigned long)vi);

	err = register_netdev(dev);
	if (err) {
		pr_debug("virtio_net: registering device failed\n");
		goto free_send;
	}

	/* Last of all, set up some receive buffers. */
	try_fill_recv(vi);

	/* If we didn't even get one input buffer, we're useless. */
	if (vi->num == 0) {
		err = -ENOMEM;
		goto unregister;
	}

	pr_debug("virtnet: registered device %s\n", dev->name);
	return 0;

unregister:
	unregister_netdev(dev);
free_send:
	vdev->config->del_vq(vi->svq);
free_recv:
	vdev->config->del_vq(vi->rvq);
free:
	free_netdev(dev);
	return err;
}

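/* Device teardown: reset the device so no virtqueue activity remains,
 * then free queued skbs, delete the virtqueues, unregister the netdev
 * and release our page free list. */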
static void virtnet_remove(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
	struct sk_buff *skb;

	/* Stop all the virtqueues. */
	vdev->config->reset(vdev);

	if (!vi->free_in_tasklet)
		del_timer_sync(&vi->xmit_free_timer);

	/* Free our skbs in send and recv queues, if any. */
	while ((skb = __skb_dequeue(&vi->recv)) != NULL) {
		kfree_skb(skb);
		vi->num--;
	}
	__skb_queue_purge(&vi->send);

	BUG_ON(vi->num != 0);

	vdev->config->del_vq(vi->svq);
	vdev->config->del_vq(vi->rvq);
	unregister_netdev(vi->dev);

	while (vi->pages)
		__free_pages(get_a_page(vi, GFP_KERNEL), 0);

	free_netdev(vi->dev);
}

static struct virtio_device_id id_table[] = {
	{ VIRTIO_ID_NET, VIRTIO_DEV_ANY_ID },
	{ 0 },
};

static unsigned int features[] = {
	VIRTIO_NET_F_CSUM, VIRTIO_NET_F_GUEST_CSUM,
	VIRTIO_NET_F_GSO, VIRTIO_NET_F_MAC,
	VIRTIO_NET_F_HOST_TSO4, VIRTIO_NET_F_HOST_UFO, VIRTIO_NET_F_HOST_TSO6,
	VIRTIO_NET_F_HOST_ECN, VIRTIO_NET_F_GUEST_TSO4, VIRTIO_NET_F_GUEST_TSO6,
	VIRTIO_NET_F_GUEST_ECN, /* We don't yet handle UFO input. */
	VIRTIO_NET_F_MRG_RXBUF,
	VIRTIO_F_NOTIFY_ON_EMPTY,
};

static struct virtio_driver virtio_net = {
	.feature_table = features,
	.feature_table_size = ARRAY_SIZE(features),
	.driver.name = KBUILD_MODNAME,
	.driver.owner = THIS_MODULE,
	.id_table = id_table,
	.probe = virtnet_probe,
	.remove = __devexit_p(virtnet_remove),
};

static int __init init(void)
{
	return register_virtio_driver(&virtio_net);
}

static void __exit fini(void)
{
	unregister_virtio_driver(&virtio_net);
}
module_init(init);
module_exit(fini);

MODULE_DEVICE_TABLE(virtio, id_table);
MODULE_DESCRIPTION("Virtio network driver");
MODULE_LICENSE("GPL");