blob: 97f7f535f41208cfcb695bd7d8f7d7b1f928c13b [file] [log] [blame]
/* Copyright (c) 2006 Coraid, Inc. See COPYING for GPL terms. */
/*
 * aoecmd.c
 * Filesystem request handling methods
 */
6
7#include <linux/hdreg.h>
8#include <linux/blkdev.h>
9#include <linux/skbuff.h>
10#include <linux/netdevice.h>
Ed L. Cashin3ae1c242006-01-19 13:46:19 -050011#include <linux/genhd.h>
Ed L. Cashin475172f2005-09-29 12:47:40 -040012#include <asm/unaligned.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include "aoe.h"
14
15#define TIMERTICK (HZ / 10)
16#define MINTIMER (2 * TIMERTICK)
17#define MAXTIMER (HZ << 1)
Ed L. Cashinb751e8b2006-09-20 14:36:50 -040018
19static int aoe_deadsecs = 60 * 3;
20module_param(aoe_deadsecs, int, 0644);
21MODULE_PARM_DESC(aoe_deadsecs, "After aoe_deadsecs seconds, give up and fail dev.");
Linus Torvalds1da177e2005-04-16 15:20:36 -070022
Ed L. Cashine407a7f2006-09-20 14:36:49 -040023struct sk_buff *
24new_skb(ulong len)
Linus Torvalds1da177e2005-04-16 15:20:36 -070025{
26 struct sk_buff *skb;
27
28 skb = alloc_skb(len, GFP_ATOMIC);
29 if (skb) {
30 skb->nh.raw = skb->mac.raw = skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -070031 skb->protocol = __constant_htons(ETH_P_AOE);
32 skb->priority = 0;
33 skb_put(skb, len);
Ed L. Cashin50bba752006-01-19 12:37:24 -050034 memset(skb->head, 0, len);
Linus Torvalds1da177e2005-04-16 15:20:36 -070035 skb->next = skb->prev = NULL;
36
37 /* tell the network layer not to perform IP checksums
38 * or to get the NIC to do it
39 */
40 skb->ip_summed = CHECKSUM_NONE;
41 }
42 return skb;
43}
44
Linus Torvalds1da177e2005-04-16 15:20:36 -070045static struct frame *
46getframe(struct aoedev *d, int tag)
47{
48 struct frame *f, *e;
49
50 f = d->frames;
51 e = f + d->nframes;
52 for (; f<e; f++)
53 if (f->tag == tag)
54 return f;
55 return NULL;
56}
57
58/*
59 * Leave the top bit clear so we have tagspace for userland.
60 * The bottom 16 bits are the xmit tick for rexmit/rttavg processing.
61 * This driver reserves tag -1 to mean "unused frame."
62 */
63static int
64newtag(struct aoedev *d)
65{
66 register ulong n;
67
68 n = jiffies & 0xffff;
69 return n |= (++d->lasttag & 0x7fff) << 16;
70}
71
72static int
73aoehdr_atainit(struct aoedev *d, struct aoe_hdr *h)
74{
Linus Torvalds1da177e2005-04-16 15:20:36 -070075 u32 host_tag = newtag(d);
Linus Torvalds1da177e2005-04-16 15:20:36 -070076
77 memcpy(h->src, d->ifp->dev_addr, sizeof h->src);
78 memcpy(h->dst, d->addr, sizeof h->dst);
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -070079 h->type = __constant_cpu_to_be16(ETH_P_AOE);
Linus Torvalds1da177e2005-04-16 15:20:36 -070080 h->verfl = AOE_HVER;
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -070081 h->major = cpu_to_be16(d->aoemajor);
Linus Torvalds1da177e2005-04-16 15:20:36 -070082 h->minor = d->aoeminor;
83 h->cmd = AOECMD_ATA;
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -070084 h->tag = cpu_to_be32(host_tag);
Linus Torvalds1da177e2005-04-16 15:20:36 -070085
86 return host_tag;
87}
88
Ed L. Cashin19bf2632006-09-20 14:36:49 -040089static inline void
90put_lba(struct aoe_atahdr *ah, sector_t lba)
91{
92 ah->lba0 = lba;
93 ah->lba1 = lba >>= 8;
94 ah->lba2 = lba >>= 8;
95 ah->lba3 = lba >>= 8;
96 ah->lba4 = lba >>= 8;
97 ah->lba5 = lba >>= 8;
98}
99
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100static void
101aoecmd_ata_rw(struct aoedev *d, struct frame *f)
102{
103 struct aoe_hdr *h;
104 struct aoe_atahdr *ah;
105 struct buf *buf;
106 struct sk_buff *skb;
107 ulong bcnt;
108 register sector_t sector;
109 char writebit, extbit;
110
111 writebit = 0x10;
112 extbit = 0x4;
113
114 buf = d->inprocess;
115
116 sector = buf->sector;
117 bcnt = buf->bv_resid;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400118 if (bcnt > d->maxbcnt)
119 bcnt = d->maxbcnt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
121 /* initialize the headers & frame */
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400122 skb = f->skb;
123 h = (struct aoe_hdr *) skb->mac.raw;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124 ah = (struct aoe_atahdr *) (h+1);
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400125 skb->len = sizeof *h + sizeof *ah;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400126 memset(h, 0, ETH_ZLEN);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127 f->tag = aoehdr_atainit(d, h);
128 f->waited = 0;
129 f->buf = buf;
130 f->bufaddr = buf->bufaddr;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400131 f->bcnt = bcnt;
132 f->lba = sector;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133
134 /* set up ata header */
135 ah->scnt = bcnt >> 9;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400136 put_lba(ah, sector);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 if (d->flags & DEVFL_EXT) {
138 ah->aflags |= AOEAFL_EXT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 } else {
140 extbit = 0;
141 ah->lba3 &= 0x0f;
142 ah->lba3 |= 0xe0; /* LBA bit + obsolete 0xa0 */
143 }
144
145 if (bio_data_dir(buf->bio) == WRITE) {
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400146 skb_fill_page_desc(skb, 0, virt_to_page(f->bufaddr),
147 offset_in_page(f->bufaddr), bcnt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148 ah->aflags |= AOEAFL_WRITE;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400149 skb->len += bcnt;
150 skb->data_len = bcnt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 } else {
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400152 skb->len = ETH_ZLEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 writebit = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154 }
155
156 ah->cmdstat = WIN_READ | writebit | extbit;
157
158 /* mark all tracking fields and load out */
159 buf->nframesout += 1;
160 buf->bufaddr += bcnt;
161 buf->bv_resid -= bcnt;
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400162/* printk(KERN_DEBUG "aoe: bv_resid=%ld\n", buf->bv_resid); */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 buf->resid -= bcnt;
164 buf->sector += bcnt >> 9;
165 if (buf->resid == 0) {
166 d->inprocess = NULL;
167 } else if (buf->bv_resid == 0) {
168 buf->bv++;
Ed L. Cashin392e4842006-09-20 14:36:50 -0400169 WARN_ON(buf->bv->bv_len == 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700170 buf->bv_resid = buf->bv->bv_len;
171 buf->bufaddr = page_address(buf->bv->bv_page) + buf->bv->bv_offset;
172 }
173
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400174 skb->dev = d->ifp;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400175 skb = skb_clone(skb, GFP_ATOMIC);
176 if (skb == NULL)
177 return;
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400178 if (d->sendq_hd)
179 d->sendq_tl->next = skb;
180 else
181 d->sendq_hd = skb;
182 d->sendq_tl = skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183}
184
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500185/* some callers cannot sleep, and they can call this function,
186 * transmitting the packets later, when interrupts are on
187 */
188static struct sk_buff *
189aoecmd_cfg_pkts(ushort aoemajor, unsigned char aoeminor, struct sk_buff **tail)
190{
191 struct aoe_hdr *h;
192 struct aoe_cfghdr *ch;
193 struct sk_buff *skb, *sl, *sl_tail;
194 struct net_device *ifp;
195
196 sl = sl_tail = NULL;
197
198 read_lock(&dev_base_lock);
199 for (ifp = dev_base; ifp; dev_put(ifp), ifp = ifp->next) {
200 dev_hold(ifp);
201 if (!is_aoe_netif(ifp))
202 continue;
203
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400204 skb = new_skb(sizeof *h + sizeof *ch);
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500205 if (skb == NULL) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400206 printk(KERN_INFO "aoe: skb alloc failure\n");
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500207 continue;
208 }
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400209 skb->dev = ifp;
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500210 if (sl_tail == NULL)
211 sl_tail = skb;
212 h = (struct aoe_hdr *) skb->mac.raw;
213 memset(h, 0, sizeof *h + sizeof *ch);
214
215 memset(h->dst, 0xff, sizeof h->dst);
216 memcpy(h->src, ifp->dev_addr, sizeof h->src);
217 h->type = __constant_cpu_to_be16(ETH_P_AOE);
218 h->verfl = AOE_HVER;
219 h->major = cpu_to_be16(aoemajor);
220 h->minor = aoeminor;
221 h->cmd = AOECMD_CFG;
222
223 skb->next = sl;
224 sl = skb;
225 }
226 read_unlock(&dev_base_lock);
227
228 if (tail != NULL)
229 *tail = sl_tail;
230 return sl;
231}
232
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400233static struct frame *
234freeframe(struct aoedev *d)
235{
236 struct frame *f, *e;
237 int n = 0;
238
239 f = d->frames;
240 e = f + d->nframes;
241 for (; f<e; f++) {
242 if (f->tag != FREETAG)
243 continue;
244 if (atomic_read(&skb_shinfo(f->skb)->dataref) == 1) {
245 skb_shinfo(f->skb)->nr_frags = f->skb->data_len = 0;
246 return f;
247 }
248 n++;
249 }
250 if (n == d->nframes) /* wait for network layer */
251 d->flags |= DEVFL_KICKME;
252
253 return NULL;
254}
255
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256/* enters with d->lock held */
257void
258aoecmd_work(struct aoedev *d)
259{
260 struct frame *f;
261 struct buf *buf;
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500262
263 if (d->flags & DEVFL_PAUSE) {
264 if (!aoedev_isbusy(d))
265 d->sendq_hd = aoecmd_cfg_pkts(d->aoemajor,
266 d->aoeminor, &d->sendq_tl);
267 return;
268 }
269
Linus Torvalds1da177e2005-04-16 15:20:36 -0700270loop:
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400271 f = freeframe(d);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272 if (f == NULL)
273 return;
274 if (d->inprocess == NULL) {
275 if (list_empty(&d->bufq))
276 return;
277 buf = container_of(d->bufq.next, struct buf, bufs);
278 list_del(d->bufq.next);
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400279/*printk(KERN_DEBUG "aoe: bi_size=%ld\n", buf->bio->bi_size); */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280 d->inprocess = buf;
281 }
282 aoecmd_ata_rw(d, f);
283 goto loop;
284}
285
286static void
287rexmit(struct aoedev *d, struct frame *f)
288{
289 struct sk_buff *skb;
290 struct aoe_hdr *h;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400291 struct aoe_atahdr *ah;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292 char buf[128];
293 u32 n;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294
295 n = newtag(d);
296
297 snprintf(buf, sizeof buf,
298 "%15s e%ld.%ld oldtag=%08x@%08lx newtag=%08x\n",
299 "retransmit",
300 d->aoemajor, d->aoeminor, f->tag, jiffies, n);
301 aoechr_error(buf);
302
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400303 skb = f->skb;
304 h = (struct aoe_hdr *) skb->mac.raw;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400305 ah = (struct aoe_atahdr *) (h+1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 f->tag = n;
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700307 h->tag = cpu_to_be32(n);
Ed L. Cashin2dd5e422006-01-19 13:46:25 -0500308 memcpy(h->dst, d->addr, sizeof h->dst);
309 memcpy(h->src, d->ifp->dev_addr, sizeof h->src);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400311 n = DEFAULTBCNT / 512;
312 if (ah->scnt > n) {
313 ah->scnt = n;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400314 if (ah->aflags & AOEAFL_WRITE) {
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400315 skb_fill_page_desc(skb, 0, virt_to_page(f->bufaddr),
316 offset_in_page(f->bufaddr), DEFAULTBCNT);
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400317 skb->len = sizeof *h + sizeof *ah + DEFAULTBCNT;
318 skb->data_len = DEFAULTBCNT;
319 }
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400320 if (++d->lostjumbo > (d->nframes << 1))
321 if (d->maxbcnt != DEFAULTBCNT) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400322 printk(KERN_INFO "aoe: e%ld.%ld: too many lost jumbo on %s - using 1KB frames.\n",
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400323 d->aoemajor, d->aoeminor, d->ifp->name);
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400324 d->maxbcnt = DEFAULTBCNT;
325 d->flags |= DEVFL_MAXBCNT;
326 }
327 }
328
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400329 skb->dev = d->ifp;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400330 skb = skb_clone(skb, GFP_ATOMIC);
331 if (skb == NULL)
332 return;
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400333 if (d->sendq_hd)
334 d->sendq_tl->next = skb;
335 else
336 d->sendq_hd = skb;
337 d->sendq_tl = skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338}
339
340static int
341tsince(int tag)
342{
343 int n;
344
345 n = jiffies & 0xffff;
346 n -= tag & 0xffff;
347 if (n < 0)
348 n += 1<<16;
349 return n;
350}
351
352static void
353rexmit_timer(ulong vp)
354{
355 struct aoedev *d;
356 struct frame *f, *e;
357 struct sk_buff *sl;
358 register long timeout;
359 ulong flags, n;
360
361 d = (struct aoedev *) vp;
362 sl = NULL;
363
364 /* timeout is always ~150% of the moving average */
365 timeout = d->rttavg;
366 timeout += timeout >> 1;
367
368 spin_lock_irqsave(&d->lock, flags);
369
370 if (d->flags & DEVFL_TKILL) {
Ed L. Cashin1c6f3fc2006-01-25 13:54:44 -0500371 spin_unlock_irqrestore(&d->lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 return;
373 }
374 f = d->frames;
375 e = f + d->nframes;
376 for (; f<e; f++) {
377 if (f->tag != FREETAG && tsince(f->tag) >= timeout) {
378 n = f->waited += timeout;
379 n /= HZ;
Ed L. Cashinb751e8b2006-09-20 14:36:50 -0400380 if (n > aoe_deadsecs) { /* waited too long for response */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 aoedev_downdev(d);
Ed L. Cashin1c6f3fc2006-01-25 13:54:44 -0500382 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383 }
384 rexmit(d, f);
385 }
386 }
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400387 if (d->flags & DEVFL_KICKME) {
388 d->flags &= ~DEVFL_KICKME;
389 aoecmd_work(d);
390 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391
ecashin@coraid.coma4b38362005-04-18 22:00:22 -0700392 sl = d->sendq_hd;
393 d->sendq_hd = d->sendq_tl = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394 if (sl) {
395 n = d->rttavg <<= 1;
396 if (n > MAXTIMER)
397 d->rttavg = MAXTIMER;
398 }
399
400 d->timer.expires = jiffies + TIMERTICK;
401 add_timer(&d->timer);
402
403 spin_unlock_irqrestore(&d->lock, flags);
404
405 aoenet_xmit(sl);
406}
407
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500408/* this function performs work that has been deferred until sleeping is OK
409 */
410void
David Howellsc4028952006-11-22 14:57:56 +0000411aoecmd_sleepwork(struct work_struct *work)
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500412{
David Howellsc4028952006-11-22 14:57:56 +0000413 struct aoedev *d = container_of(work, struct aoedev, work);
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500414
415 if (d->flags & DEVFL_GDALLOC)
416 aoeblk_gdalloc(d);
417
418 if (d->flags & DEVFL_NEWSIZE) {
419 struct block_device *bd;
420 unsigned long flags;
421 u64 ssize;
422
423 ssize = d->gd->capacity;
424 bd = bdget_disk(d->gd, 0);
425
426 if (bd) {
427 mutex_lock(&bd->bd_inode->i_mutex);
428 i_size_write(bd->bd_inode, (loff_t)ssize<<9);
429 mutex_unlock(&bd->bd_inode->i_mutex);
430 bdput(bd);
431 }
432 spin_lock_irqsave(&d->lock, flags);
433 d->flags |= DEVFL_UP;
434 d->flags &= ~DEVFL_NEWSIZE;
435 spin_unlock_irqrestore(&d->lock, flags);
436 }
437}
438
Linus Torvalds1da177e2005-04-16 15:20:36 -0700439static void
440ataid_complete(struct aoedev *d, unsigned char *id)
441{
442 u64 ssize;
443 u16 n;
444
445 /* word 83: command set supported */
Ed L. Cashin475172f2005-09-29 12:47:40 -0400446 n = le16_to_cpu(get_unaligned((__le16 *) &id[83<<1]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700447
448 /* word 86: command set/feature enabled */
Ed L. Cashin475172f2005-09-29 12:47:40 -0400449 n |= le16_to_cpu(get_unaligned((__le16 *) &id[86<<1]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450
451 if (n & (1<<10)) { /* bit 10: LBA 48 */
452 d->flags |= DEVFL_EXT;
453
454 /* word 100: number lba48 sectors */
Ed L. Cashin475172f2005-09-29 12:47:40 -0400455 ssize = le64_to_cpu(get_unaligned((__le64 *) &id[100<<1]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700456
457 /* set as in ide-disk.c:init_idedisk_capacity */
458 d->geo.cylinders = ssize;
459 d->geo.cylinders /= (255 * 63);
460 d->geo.heads = 255;
461 d->geo.sectors = 63;
462 } else {
463 d->flags &= ~DEVFL_EXT;
464
465 /* number lba28 sectors */
Ed L. Cashin475172f2005-09-29 12:47:40 -0400466 ssize = le32_to_cpu(get_unaligned((__le32 *) &id[60<<1]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700467
468 /* NOTE: obsolete in ATA 6 */
Ed L. Cashin475172f2005-09-29 12:47:40 -0400469 d->geo.cylinders = le16_to_cpu(get_unaligned((__le16 *) &id[54<<1]));
470 d->geo.heads = le16_to_cpu(get_unaligned((__le16 *) &id[55<<1]));
471 d->geo.sectors = le16_to_cpu(get_unaligned((__le16 *) &id[56<<1]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472 }
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500473
474 if (d->ssize != ssize)
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400475 printk(KERN_INFO "aoe: %012llx e%lu.%lu v%04x has %llu sectors\n",
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400476 (unsigned long long)mac_addr(d->addr),
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500477 d->aoemajor, d->aoeminor,
478 d->fw_ver, (long long)ssize);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479 d->ssize = ssize;
480 d->geo.start = 0;
481 if (d->gd != NULL) {
482 d->gd->capacity = ssize;
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500483 d->flags |= DEVFL_NEWSIZE;
484 } else {
485 if (d->flags & DEVFL_GDALLOC) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400486 printk(KERN_ERR "aoe: can't schedule work for e%lu.%lu, %s\n",
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500487 d->aoemajor, d->aoeminor,
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400488 "it's already on! This shouldn't happen.\n");
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500489 return;
490 }
491 d->flags |= DEVFL_GDALLOC;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493 schedule_work(&d->work);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494}
495
496static void
497calc_rttavg(struct aoedev *d, int rtt)
498{
499 register long n;
500
501 n = rtt;
Ed L. Cashindced3a02006-09-20 14:36:49 -0400502 if (n < 0) {
503 n = -rtt;
504 if (n < MINTIMER)
505 n = MINTIMER;
506 else if (n > MAXTIMER)
507 n = MAXTIMER;
508 d->mintimer += (n - d->mintimer) >> 1;
509 } else if (n < d->mintimer)
510 n = d->mintimer;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 else if (n > MAXTIMER)
512 n = MAXTIMER;
513
514 /* g == .25; cf. Congestion Avoidance and Control, Jacobson & Karels; 1988 */
515 n -= d->rttavg;
516 d->rttavg += n >> 2;
517}
518
519void
520aoecmd_ata_rsp(struct sk_buff *skb)
521{
522 struct aoedev *d;
Ed L. Cashinddec63e2006-09-20 14:36:49 -0400523 struct aoe_hdr *hin, *hout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 struct aoe_atahdr *ahin, *ahout;
525 struct frame *f;
526 struct buf *buf;
527 struct sk_buff *sl;
528 register long n;
529 ulong flags;
530 char ebuf[128];
ecashin@coraid.com32465c62005-04-18 22:00:18 -0700531 u16 aoemajor;
532
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533 hin = (struct aoe_hdr *) skb->mac.raw;
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700534 aoemajor = be16_to_cpu(hin->major);
ecashin@coraid.com32465c62005-04-18 22:00:18 -0700535 d = aoedev_by_aoeaddr(aoemajor, hin->minor);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 if (d == NULL) {
537 snprintf(ebuf, sizeof ebuf, "aoecmd_ata_rsp: ata response "
538 "for unknown device %d.%d\n",
ecashin@coraid.com32465c62005-04-18 22:00:18 -0700539 aoemajor, hin->minor);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540 aoechr_error(ebuf);
541 return;
542 }
543
544 spin_lock_irqsave(&d->lock, flags);
545
Ed L. Cashindced3a02006-09-20 14:36:49 -0400546 n = be32_to_cpu(hin->tag);
547 f = getframe(d, n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548 if (f == NULL) {
Ed L. Cashindced3a02006-09-20 14:36:49 -0400549 calc_rttavg(d, -tsince(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700550 spin_unlock_irqrestore(&d->lock, flags);
551 snprintf(ebuf, sizeof ebuf,
552 "%15s e%d.%d tag=%08x@%08lx\n",
553 "unexpected rsp",
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700554 be16_to_cpu(hin->major),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 hin->minor,
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700556 be32_to_cpu(hin->tag),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700557 jiffies);
558 aoechr_error(ebuf);
559 return;
560 }
561
562 calc_rttavg(d, tsince(f->tag));
563
564 ahin = (struct aoe_atahdr *) (hin+1);
Ed L. Cashinddec63e2006-09-20 14:36:49 -0400565 hout = (struct aoe_hdr *) f->skb->mac.raw;
566 ahout = (struct aoe_atahdr *) (hout+1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567 buf = f->buf;
568
Ed L. Cashin9d419652006-02-07 11:37:24 -0500569 if (ahout->cmdstat == WIN_IDENTIFY)
570 d->flags &= ~DEVFL_PAUSE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 if (ahin->cmdstat & 0xa9) { /* these bits cleared on success */
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400572 printk(KERN_ERR
573 "aoe: ata error cmd=%2.2Xh stat=%2.2Xh from e%ld.%ld\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700574 ahout->cmdstat, ahin->cmdstat,
575 d->aoemajor, d->aoeminor);
576 if (buf)
577 buf->flags |= BUFFL_FAIL;
578 } else {
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400579 n = ahout->scnt << 9;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580 switch (ahout->cmdstat) {
581 case WIN_READ:
582 case WIN_READ_EXT:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700583 if (skb->len - sizeof *hin - sizeof *ahin < n) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400584 printk(KERN_ERR
585 "aoe: runt data size in read. skb->len=%d\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586 skb->len);
587 /* fail frame f? just returning will rexmit. */
588 spin_unlock_irqrestore(&d->lock, flags);
589 return;
590 }
591 memcpy(f->bufaddr, ahin+1, n);
592 case WIN_WRITE:
593 case WIN_WRITE_EXT:
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400594 if (f->bcnt -= n) {
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400595 skb = f->skb;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400596 f->bufaddr += n;
597 put_lba(ahout, f->lba += ahout->scnt);
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400598 n = f->bcnt;
599 if (n > DEFAULTBCNT)
600 n = DEFAULTBCNT;
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400601 ahout->scnt = n >> 9;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400602 if (ahout->aflags & AOEAFL_WRITE) {
603 skb_fill_page_desc(skb, 0,
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400604 virt_to_page(f->bufaddr),
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400605 offset_in_page(f->bufaddr), n);
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400606 skb->len = sizeof *hout + sizeof *ahout + n;
607 skb->data_len = n;
608 }
Ed L. Cashinddec63e2006-09-20 14:36:49 -0400609 f->tag = newtag(d);
610 hout->tag = cpu_to_be32(f->tag);
611 skb->dev = d->ifp;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400612 skb = skb_clone(skb, GFP_ATOMIC);
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400613 spin_unlock_irqrestore(&d->lock, flags);
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400614 if (skb)
615 aoenet_xmit(skb);
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400616 return;
617 }
618 if (n > DEFAULTBCNT)
619 d->lostjumbo = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700620 break;
621 case WIN_IDENTIFY:
622 if (skb->len - sizeof *hin - sizeof *ahin < 512) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400623 printk(KERN_INFO
624 "aoe: runt data size in ataid. skb->len=%d\n",
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400625 skb->len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626 spin_unlock_irqrestore(&d->lock, flags);
627 return;
628 }
629 ataid_complete(d, (char *) (ahin+1));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630 break;
631 default:
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400632 printk(KERN_INFO
633 "aoe: unrecognized ata command %2.2Xh for %d.%d\n",
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400634 ahout->cmdstat,
635 be16_to_cpu(hin->major),
636 hin->minor);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700637 }
638 }
639
640 if (buf) {
641 buf->nframesout -= 1;
642 if (buf->nframesout == 0 && buf->resid == 0) {
ecashin@coraid.com0c6f0e72005-04-18 22:00:22 -0700643 unsigned long duration = jiffies - buf->start_time;
644 unsigned long n_sect = buf->bio->bi_size >> 9;
645 struct gendisk *disk = d->gd;
Jens Axboe496456c2005-11-01 09:54:23 +0100646 const int rw = bio_data_dir(buf->bio);
ecashin@coraid.com0c6f0e72005-04-18 22:00:22 -0700647
Jens Axboe496456c2005-11-01 09:54:23 +0100648 disk_stat_inc(disk, ios[rw]);
649 disk_stat_add(disk, ticks[rw], duration);
650 disk_stat_add(disk, sectors[rw], n_sect);
ecashin@coraid.com0c6f0e72005-04-18 22:00:22 -0700651 disk_stat_add(disk, io_ticks, duration);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 n = (buf->flags & BUFFL_FAIL) ? -EIO : 0;
653 bio_endio(buf->bio, buf->bio->bi_size, n);
654 mempool_free(buf, d->bufpool);
655 }
656 }
657
658 f->buf = NULL;
659 f->tag = FREETAG;
660
661 aoecmd_work(d);
ecashin@coraid.coma4b38362005-04-18 22:00:22 -0700662 sl = d->sendq_hd;
663 d->sendq_hd = d->sendq_tl = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700664
665 spin_unlock_irqrestore(&d->lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700666 aoenet_xmit(sl);
667}
668
669void
670aoecmd_cfg(ushort aoemajor, unsigned char aoeminor)
671{
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500672 struct sk_buff *sl;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700673
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500674 sl = aoecmd_cfg_pkts(aoemajor, aoeminor, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675
676 aoenet_xmit(sl);
677}
678
679/*
680 * Since we only call this in one place (and it only prepares one frame)
ecashin@coraid.coma4b38362005-04-18 22:00:22 -0700681 * we just return the skb. Usually we'd chain it up to the aoedev sendq.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700682 */
683static struct sk_buff *
684aoecmd_ata_id(struct aoedev *d)
685{
686 struct aoe_hdr *h;
687 struct aoe_atahdr *ah;
688 struct frame *f;
689 struct sk_buff *skb;
690
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400691 f = freeframe(d);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692 if (f == NULL) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400693 printk(KERN_ERR "aoe: can't get a frame. This shouldn't happen.\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 return NULL;
695 }
696
697 /* initialize the headers & frame */
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400698 skb = f->skb;
699 h = (struct aoe_hdr *) skb->mac.raw;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700700 ah = (struct aoe_atahdr *) (h+1);
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400701 skb->len = ETH_ZLEN;
702 memset(h, 0, ETH_ZLEN);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700703 f->tag = aoehdr_atainit(d, h);
704 f->waited = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706 /* set up ata header */
707 ah->scnt = 1;
708 ah->cmdstat = WIN_IDENTIFY;
709 ah->lba3 = 0xa0;
710
Ed L. Cashine407a7f2006-09-20 14:36:49 -0400711 skb->dev = d->ifp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700712
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500713 d->rttavg = MAXTIMER;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714 d->timer.function = rexmit_timer;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400716 return skb_clone(skb, GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717}
718
719void
720aoecmd_cfg_rsp(struct sk_buff *skb)
721{
722 struct aoedev *d;
723 struct aoe_hdr *h;
724 struct aoe_cfghdr *ch;
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700725 ulong flags, sysminor, aoemajor;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726 struct sk_buff *sl;
Ed L. Cashineaf0a3c2006-01-19 13:46:20 -0500727 enum { MAXFRAMES = 16 };
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400728 u16 n;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700729
730 h = (struct aoe_hdr *) skb->mac.raw;
731 ch = (struct aoe_cfghdr *) (h+1);
732
733 /*
734 * Enough people have their dip switches set backwards to
735 * warrant a loud message for this special case.
736 */
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700737 aoemajor = be16_to_cpu(h->major);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738 if (aoemajor == 0xfff) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400739 printk(KERN_ERR "aoe: Warning: shelf address is all ones. "
Ed L. Cashin6bb6285f2006-09-20 14:36:49 -0400740 "Check shelf dip switches.\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741 return;
742 }
743
744 sysminor = SYSMINOR(aoemajor, h->minor);
ecashin@coraid.comfc458dc2005-04-18 22:00:17 -0700745 if (sysminor * AOE_PARTITIONS + AOE_PARTITIONS > MINORMASK) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400746 printk(KERN_INFO "aoe: e%ld.%d: minor number too large\n",
ecashin@coraid.comfc458dc2005-04-18 22:00:17 -0700747 aoemajor, (int) h->minor);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748 return;
749 }
750
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400751 n = be16_to_cpu(ch->bufcnt);
752 if (n > MAXFRAMES) /* keep it reasonable */
753 n = MAXFRAMES;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400755 d = aoedev_by_sysminor_m(sysminor, n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700756 if (d == NULL) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400757 printk(KERN_INFO "aoe: device sysminor_m failure\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758 return;
759 }
760
761 spin_lock_irqsave(&d->lock, flags);
762
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500763 /* permit device to migrate mac and network interface */
764 d->ifp = skb->dev;
765 memcpy(d->addr, h->src, sizeof d->addr);
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400766 if (!(d->flags & DEVFL_MAXBCNT)) {
767 n = d->ifp->mtu;
768 n -= sizeof (struct aoe_hdr) + sizeof (struct aoe_atahdr);
769 n /= 512;
770 if (n > ch->scnt)
771 n = ch->scnt;
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400772 n = n ? n * 512 : DEFAULTBCNT;
773 if (n != d->maxbcnt) {
Ed L. Cashina12c93f2006-09-20 14:36:51 -0400774 printk(KERN_INFO
775 "aoe: e%ld.%ld: setting %d byte data frames on %s\n",
Ed L. Cashin4f51dc52006-09-20 14:36:49 -0400776 d->aoemajor, d->aoeminor, n, d->ifp->name);
777 d->maxbcnt = n;
778 }
Ed L. Cashin19bf2632006-09-20 14:36:49 -0400779 }
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500780
781 /* don't change users' perspective */
782 if (d->nopen && !(d->flags & DEVFL_PAUSE)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783 spin_unlock_irqrestore(&d->lock, flags);
784 return;
785 }
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500786 d->flags |= DEVFL_PAUSE; /* force pause */
Ed L. Cashindced3a02006-09-20 14:36:49 -0400787 d->mintimer = MINTIMER;
ecashin@coraid.com63e9cc52005-04-18 22:00:20 -0700788 d->fw_ver = be16_to_cpu(ch->fwver);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700789
Ed L. Cashin3ae1c242006-01-19 13:46:19 -0500790 /* check for already outstanding ataid */
791 sl = aoedev_isbusy(d) == 0 ? aoecmd_ata_id(d) : NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792
793 spin_unlock_irqrestore(&d->lock, flags);
794
795 aoenet_xmit(sl);
796}
797