]> bbs.cooldavid.org Git - net-next-2.6.git/blame - drivers/block/aoe/aoecmd.c
aoe: remove dev_base_lock use from aoecmd_cfg_pkts()
[net-next-2.6.git] / drivers / block / aoe / aoecmd.c
CommitLineData
52e112b3 1/* Copyright (c) 2007 Coraid, Inc. See COPYING for GPL terms. */
1da177e4
LT
2/*
3 * aoecmd.c
4 * Filesystem request handling methods
5 */
6
04b3ab52 7#include <linux/ata.h>
5a0e3ad6 8#include <linux/slab.h>
1da177e4
LT
9#include <linux/hdreg.h>
10#include <linux/blkdev.h>
11#include <linux/skbuff.h>
12#include <linux/netdevice.h>
3ae1c24e 13#include <linux/genhd.h>
68e0d42f 14#include <linux/moduleparam.h>
881d966b 15#include <net/net_namespace.h>
475172fb 16#include <asm/unaligned.h>
1da177e4
LT
17#include "aoe.h"
18
b751e8b6
EC
19static int aoe_deadsecs = 60 * 3;
20module_param(aoe_deadsecs, int, 0644);
21MODULE_PARM_DESC(aoe_deadsecs, "After aoe_deadsecs seconds, give up and fail dev.");
1da177e4 22
7df620d8
EC
23static int aoe_maxout = 16;
24module_param(aoe_maxout, int, 0644);
25MODULE_PARM_DESC(aoe_maxout,
26 "Only aoe_maxout outstanding packets for every MAC on eX.Y.");
27
68e0d42f 28static struct sk_buff *
e407a7f6 29new_skb(ulong len)
1da177e4
LT
30{
31 struct sk_buff *skb;
32
33 skb = alloc_skb(len, GFP_ATOMIC);
34 if (skb) {
459a98ed 35 skb_reset_mac_header(skb);
c1d2bbe1 36 skb_reset_network_header(skb);
1da177e4 37 skb->protocol = __constant_htons(ETH_P_AOE);
1da177e4
LT
38 }
39 return skb;
40}
41
1da177e4 42static struct frame *
68e0d42f 43getframe(struct aoetgt *t, int tag)
1da177e4
LT
44{
45 struct frame *f, *e;
46
68e0d42f
EC
47 f = t->frames;
48 e = f + t->nframes;
1da177e4
LT
49 for (; f<e; f++)
50 if (f->tag == tag)
51 return f;
52 return NULL;
53}
54
55/*
56 * Leave the top bit clear so we have tagspace for userland.
57 * The bottom 16 bits are the xmit tick for rexmit/rttavg processing.
58 * This driver reserves tag -1 to mean "unused frame."
59 */
60static int
68e0d42f 61newtag(struct aoetgt *t)
1da177e4
LT
62{
63 register ulong n;
64
65 n = jiffies & 0xffff;
68e0d42f 66 return n |= (++t->lasttag & 0x7fff) << 16;
1da177e4
LT
67}
68
69static int
68e0d42f 70aoehdr_atainit(struct aoedev *d, struct aoetgt *t, struct aoe_hdr *h)
1da177e4 71{
68e0d42f 72 u32 host_tag = newtag(t);
1da177e4 73
68e0d42f
EC
74 memcpy(h->src, t->ifp->nd->dev_addr, sizeof h->src);
75 memcpy(h->dst, t->addr, sizeof h->dst);
63e9cc5d 76 h->type = __constant_cpu_to_be16(ETH_P_AOE);
1da177e4 77 h->verfl = AOE_HVER;
63e9cc5d 78 h->major = cpu_to_be16(d->aoemajor);
1da177e4
LT
79 h->minor = d->aoeminor;
80 h->cmd = AOECMD_ATA;
63e9cc5d 81 h->tag = cpu_to_be32(host_tag);
1da177e4
LT
82
83 return host_tag;
84}
85
19bf2635
EC
86static inline void
87put_lba(struct aoe_atahdr *ah, sector_t lba)
88{
89 ah->lba0 = lba;
90 ah->lba1 = lba >>= 8;
91 ah->lba2 = lba >>= 8;
92 ah->lba3 = lba >>= 8;
93 ah->lba4 = lba >>= 8;
94 ah->lba5 = lba >>= 8;
95}
96
1da177e4 97static void
68e0d42f
EC
98ifrotate(struct aoetgt *t)
99{
100 t->ifp++;
101 if (t->ifp >= &t->ifs[NAOEIFS] || t->ifp->nd == NULL)
102 t->ifp = t->ifs;
103 if (t->ifp->nd == NULL) {
104 printk(KERN_INFO "aoe: no interface to rotate to\n");
105 BUG();
106 }
107}
108
9bb237b6
EC
109static void
110skb_pool_put(struct aoedev *d, struct sk_buff *skb)
111{
e9bb8fb0 112 __skb_queue_tail(&d->skbpool, skb);
9bb237b6
EC
113}
114
115static struct sk_buff *
116skb_pool_get(struct aoedev *d)
117{
e9bb8fb0 118 struct sk_buff *skb = skb_peek(&d->skbpool);
9bb237b6 119
9bb237b6 120 if (skb && atomic_read(&skb_shinfo(skb)->dataref) == 1) {
e9bb8fb0 121 __skb_unlink(skb, &d->skbpool);
9bb237b6
EC
122 return skb;
123 }
e9bb8fb0
DM
124 if (skb_queue_len(&d->skbpool) < NSKBPOOLMAX &&
125 (skb = new_skb(ETH_ZLEN)))
9bb237b6 126 return skb;
e9bb8fb0 127
9bb237b6
EC
128 return NULL;
129}
130
131/* freeframe is where we do our load balancing so it's a little hairy. */
68e0d42f
EC
132static struct frame *
133freeframe(struct aoedev *d)
1da177e4 134{
9bb237b6 135 struct frame *f, *e, *rf;
68e0d42f 136 struct aoetgt **t;
9bb237b6 137 struct sk_buff *skb;
68e0d42f
EC
138
139 if (d->targets[0] == NULL) { /* shouldn't happen, but I'm paranoid */
140 printk(KERN_ERR "aoe: NULL TARGETS!\n");
141 return NULL;
142 }
9bb237b6
EC
143 t = d->tgt;
144 t++;
145 if (t >= &d->targets[NTARGETS] || !*t)
146 t = d->targets;
147 for (;;) {
148 if ((*t)->nout < (*t)->maxout
149 && t != d->htgt
150 && (*t)->ifp->nd) {
151 rf = NULL;
68e0d42f 152 f = (*t)->frames;
9bb237b6 153 e = f + (*t)->nframes;
68e0d42f
EC
154 for (; f < e; f++) {
155 if (f->tag != FREETAG)
156 continue;
9bb237b6
EC
157 skb = f->skb;
158 if (!skb
159 && !(f->skb = skb = new_skb(ETH_ZLEN)))
160 continue;
161 if (atomic_read(&skb_shinfo(skb)->dataref)
68e0d42f 162 != 1) {
9bb237b6
EC
163 if (!rf)
164 rf = f;
68e0d42f
EC
165 continue;
166 }
9bb237b6
EC
167gotone: skb_shinfo(skb)->nr_frags = skb->data_len = 0;
168 skb_trim(skb, 0);
68e0d42f
EC
169 d->tgt = t;
170 ifrotate(*t);
171 return f;
172 }
9bb237b6
EC
173 /* Work can be done, but the network layer is
174 holding our precious packets. Try to grab
175 one from the pool. */
176 f = rf;
177 if (f == NULL) { /* more paranoia */
178 printk(KERN_ERR
179 "aoe: freeframe: %s.\n",
180 "unexpected null rf");
181 d->flags |= DEVFL_KICKME;
182 return NULL;
183 }
184 skb = skb_pool_get(d);
185 if (skb) {
186 skb_pool_put(d, f->skb);
187 f->skb = skb;
188 goto gotone;
189 }
190 (*t)->dataref++;
191 if ((*t)->nout == 0)
68e0d42f
EC
192 d->flags |= DEVFL_KICKME;
193 }
9bb237b6
EC
194 if (t == d->tgt) /* we've looped and found nada */
195 break;
68e0d42f 196 t++;
9bb237b6
EC
197 if (t >= &d->targets[NTARGETS] || !*t)
198 t = d->targets;
199 }
68e0d42f
EC
200 return NULL;
201}
202
203static int
204aoecmd_ata_rw(struct aoedev *d)
205{
206 struct frame *f;
1da177e4
LT
207 struct aoe_hdr *h;
208 struct aoe_atahdr *ah;
209 struct buf *buf;
68e0d42f
EC
210 struct bio_vec *bv;
211 struct aoetgt *t;
1da177e4
LT
212 struct sk_buff *skb;
213 ulong bcnt;
1da177e4
LT
214 char writebit, extbit;
215
216 writebit = 0x10;
217 extbit = 0x4;
218
68e0d42f
EC
219 f = freeframe(d);
220 if (f == NULL)
221 return 0;
222 t = *d->tgt;
1da177e4 223 buf = d->inprocess;
68e0d42f
EC
224 bv = buf->bv;
225 bcnt = t->ifp->maxbcnt;
226 if (bcnt == 0)
227 bcnt = DEFAULTBCNT;
228 if (bcnt > buf->bv_resid)
229 bcnt = buf->bv_resid;
1da177e4 230 /* initialize the headers & frame */
e407a7f6 231 skb = f->skb;
abdbf94d 232 h = (struct aoe_hdr *) skb_mac_header(skb);
1da177e4 233 ah = (struct aoe_atahdr *) (h+1);
19900cde
EC
234 skb_put(skb, sizeof *h + sizeof *ah);
235 memset(h, 0, skb->len);
68e0d42f
EC
236 f->tag = aoehdr_atainit(d, t, h);
237 t->nout++;
1da177e4
LT
238 f->waited = 0;
239 f->buf = buf;
68e0d42f 240 f->bufaddr = page_address(bv->bv_page) + buf->bv_off;
19bf2635 241 f->bcnt = bcnt;
68e0d42f 242 f->lba = buf->sector;
1da177e4
LT
243
244 /* set up ata header */
245 ah->scnt = bcnt >> 9;
68e0d42f 246 put_lba(ah, buf->sector);
1da177e4
LT
247 if (d->flags & DEVFL_EXT) {
248 ah->aflags |= AOEAFL_EXT;
1da177e4
LT
249 } else {
250 extbit = 0;
251 ah->lba3 &= 0x0f;
252 ah->lba3 |= 0xe0; /* LBA bit + obsolete 0xa0 */
253 }
1da177e4 254 if (bio_data_dir(buf->bio) == WRITE) {
68e0d42f 255 skb_fill_page_desc(skb, 0, bv->bv_page, buf->bv_off, bcnt);
1da177e4 256 ah->aflags |= AOEAFL_WRITE;
4f51dc5e
EC
257 skb->len += bcnt;
258 skb->data_len = bcnt;
68e0d42f 259 t->wpkts++;
1da177e4 260 } else {
68e0d42f 261 t->rpkts++;
1da177e4 262 writebit = 0;
1da177e4
LT
263 }
264
04b3ab52 265 ah->cmdstat = ATA_CMD_PIO_READ | writebit | extbit;
1da177e4
LT
266
267 /* mark all tracking fields and load out */
268 buf->nframesout += 1;
68e0d42f 269 buf->bv_off += bcnt;
1da177e4 270 buf->bv_resid -= bcnt;
1da177e4
LT
271 buf->resid -= bcnt;
272 buf->sector += bcnt >> 9;
273 if (buf->resid == 0) {
274 d->inprocess = NULL;
275 } else if (buf->bv_resid == 0) {
68e0d42f
EC
276 buf->bv = ++bv;
277 buf->bv_resid = bv->bv_len;
278 WARN_ON(buf->bv_resid == 0);
279 buf->bv_off = bv->bv_offset;
1da177e4
LT
280 }
281
68e0d42f 282 skb->dev = t->ifp->nd;
4f51dc5e 283 skb = skb_clone(skb, GFP_ATOMIC);
e9bb8fb0
DM
284 if (skb)
285 __skb_queue_tail(&d->sendq, skb);
68e0d42f 286 return 1;
1da177e4
LT
287}
288
3ae1c24e
EC
289/* some callers cannot sleep, and they can call this function,
290 * transmitting the packets later, when interrupts are on
291 */
e9bb8fb0
DM
292static void
293aoecmd_cfg_pkts(ushort aoemajor, unsigned char aoeminor, struct sk_buff_head *queue)
3ae1c24e
EC
294{
295 struct aoe_hdr *h;
296 struct aoe_cfghdr *ch;
e9bb8fb0 297 struct sk_buff *skb;
3ae1c24e
EC
298 struct net_device *ifp;
299
840a185d
ED
300 rcu_read_lock();
301 for_each_netdev_rcu(&init_net, ifp) {
3ae1c24e
EC
302 dev_hold(ifp);
303 if (!is_aoe_netif(ifp))
7562f876 304 goto cont;
3ae1c24e 305
e407a7f6 306 skb = new_skb(sizeof *h + sizeof *ch);
3ae1c24e 307 if (skb == NULL) {
a12c93f0 308 printk(KERN_INFO "aoe: skb alloc failure\n");
7562f876 309 goto cont;
3ae1c24e 310 }
19900cde 311 skb_put(skb, sizeof *h + sizeof *ch);
e407a7f6 312 skb->dev = ifp;
e9bb8fb0 313 __skb_queue_tail(queue, skb);
abdbf94d 314 h = (struct aoe_hdr *) skb_mac_header(skb);
3ae1c24e
EC
315 memset(h, 0, sizeof *h + sizeof *ch);
316
317 memset(h->dst, 0xff, sizeof h->dst);
318 memcpy(h->src, ifp->dev_addr, sizeof h->src);
319 h->type = __constant_cpu_to_be16(ETH_P_AOE);
320 h->verfl = AOE_HVER;
321 h->major = cpu_to_be16(aoemajor);
322 h->minor = aoeminor;
323 h->cmd = AOECMD_CFG;
324
7562f876
PE
325cont:
326 dev_put(ifp);
3ae1c24e 327 }
840a185d 328 rcu_read_unlock();
3ae1c24e
EC
329}
330
1da177e4 331static void
68e0d42f 332resend(struct aoedev *d, struct aoetgt *t, struct frame *f)
1da177e4
LT
333{
334 struct sk_buff *skb;
335 struct aoe_hdr *h;
19bf2635 336 struct aoe_atahdr *ah;
1da177e4
LT
337 char buf[128];
338 u32 n;
1da177e4 339
68e0d42f
EC
340 ifrotate(t);
341 n = newtag(t);
342 skb = f->skb;
343 h = (struct aoe_hdr *) skb_mac_header(skb);
344 ah = (struct aoe_atahdr *) (h+1);
1da177e4
LT
345
346 snprintf(buf, sizeof buf,
411c41ee 347 "%15s e%ld.%d oldtag=%08x@%08lx newtag=%08x s=%pm d=%pm nout=%d\n",
68e0d42f 348 "retransmit", d->aoemajor, d->aoeminor, f->tag, jiffies, n,
411c41ee 349 h->src, h->dst, t->nout);
1da177e4
LT
350 aoechr_error(buf);
351
1da177e4 352 f->tag = n;
63e9cc5d 353 h->tag = cpu_to_be32(n);
68e0d42f
EC
354 memcpy(h->dst, t->addr, sizeof h->dst);
355 memcpy(h->src, t->ifp->nd->dev_addr, sizeof h->src);
356
357 switch (ah->cmdstat) {
358 default:
359 break;
04b3ab52
BZ
360 case ATA_CMD_PIO_READ:
361 case ATA_CMD_PIO_READ_EXT:
362 case ATA_CMD_PIO_WRITE:
363 case ATA_CMD_PIO_WRITE_EXT:
68e0d42f
EC
364 put_lba(ah, f->lba);
365
366 n = f->bcnt;
367 if (n > DEFAULTBCNT)
368 n = DEFAULTBCNT;
369 ah->scnt = n >> 9;
4f51dc5e 370 if (ah->aflags & AOEAFL_WRITE) {
19bf2635 371 skb_fill_page_desc(skb, 0, virt_to_page(f->bufaddr),
68e0d42f
EC
372 offset_in_page(f->bufaddr), n);
373 skb->len = sizeof *h + sizeof *ah + n;
374 skb->data_len = n;
19bf2635
EC
375 }
376 }
68e0d42f 377 skb->dev = t->ifp->nd;
4f51dc5e
EC
378 skb = skb_clone(skb, GFP_ATOMIC);
379 if (skb == NULL)
380 return;
e9bb8fb0 381 __skb_queue_tail(&d->sendq, skb);
1da177e4
LT
382}
383
384static int
385tsince(int tag)
386{
387 int n;
388
389 n = jiffies & 0xffff;
390 n -= tag & 0xffff;
391 if (n < 0)
392 n += 1<<16;
393 return n;
394}
395
68e0d42f
EC
396static struct aoeif *
397getif(struct aoetgt *t, struct net_device *nd)
398{
399 struct aoeif *p, *e;
400
401 p = t->ifs;
402 e = p + NAOEIFS;
403 for (; p < e; p++)
404 if (p->nd == nd)
405 return p;
406 return NULL;
407}
408
409static struct aoeif *
410addif(struct aoetgt *t, struct net_device *nd)
411{
412 struct aoeif *p;
413
414 p = getif(t, NULL);
415 if (!p)
416 return NULL;
417 p->nd = nd;
418 p->maxbcnt = DEFAULTBCNT;
419 p->lost = 0;
420 p->lostjumbo = 0;
421 return p;
422}
423
424static void
425ejectif(struct aoetgt *t, struct aoeif *ifp)
426{
427 struct aoeif *e;
428 ulong n;
429
430 e = t->ifs + NAOEIFS - 1;
431 n = (e - ifp) * sizeof *ifp;
432 memmove(ifp, ifp+1, n);
433 e->nd = NULL;
434}
435
436static int
437sthtith(struct aoedev *d)
438{
439 struct frame *f, *e, *nf;
440 struct sk_buff *skb;
441 struct aoetgt *ht = *d->htgt;
442
443 f = ht->frames;
444 e = f + ht->nframes;
445 for (; f < e; f++) {
446 if (f->tag == FREETAG)
447 continue;
448 nf = freeframe(d);
449 if (!nf)
450 return 0;
451 skb = nf->skb;
452 *nf = *f;
453 f->skb = skb;
454 f->tag = FREETAG;
455 nf->waited = 0;
456 ht->nout--;
457 (*d->tgt)->nout++;
458 resend(d, *d->tgt, nf);
459 }
460 /* he's clean, he's useless. take away his interfaces */
461 memset(ht->ifs, 0, sizeof ht->ifs);
462 d->htgt = NULL;
463 return 1;
464}
465
466static inline unsigned char
467ata_scnt(unsigned char *packet) {
468 struct aoe_hdr *h;
469 struct aoe_atahdr *ah;
470
471 h = (struct aoe_hdr *) packet;
472 ah = (struct aoe_atahdr *) (h+1);
473 return ah->scnt;
474}
475
1da177e4
LT
476static void
477rexmit_timer(ulong vp)
478{
e9bb8fb0 479 struct sk_buff_head queue;
1da177e4 480 struct aoedev *d;
68e0d42f
EC
481 struct aoetgt *t, **tt, **te;
482 struct aoeif *ifp;
1da177e4 483 struct frame *f, *e;
1da177e4
LT
484 register long timeout;
485 ulong flags, n;
486
487 d = (struct aoedev *) vp;
1da177e4
LT
488
489 /* timeout is always ~150% of the moving average */
490 timeout = d->rttavg;
491 timeout += timeout >> 1;
492
493 spin_lock_irqsave(&d->lock, flags);
494
495 if (d->flags & DEVFL_TKILL) {
1c6f3fca 496 spin_unlock_irqrestore(&d->lock, flags);
1da177e4
LT
497 return;
498 }
68e0d42f
EC
499 tt = d->targets;
500 te = tt + NTARGETS;
501 for (; tt < te && *tt; tt++) {
502 t = *tt;
503 f = t->frames;
504 e = f + t->nframes;
505 for (; f < e; f++) {
506 if (f->tag == FREETAG
507 || tsince(f->tag) < timeout)
508 continue;
1da177e4
LT
509 n = f->waited += timeout;
510 n /= HZ;
68e0d42f
EC
511 if (n > aoe_deadsecs) {
512 /* waited too long. device failure. */
1da177e4 513 aoedev_downdev(d);
1c6f3fca 514 break;
1da177e4 515 }
68e0d42f
EC
516
517 if (n > HELPWAIT /* see if another target can help */
518 && (tt != d->targets || d->targets[1]))
519 d->htgt = tt;
520
521 if (t->nout == t->maxout) {
522 if (t->maxout > 1)
523 t->maxout--;
524 t->lastwadj = jiffies;
525 }
526
527 ifp = getif(t, f->skb->dev);
528 if (ifp && ++ifp->lost > (t->nframes << 1)
529 && (ifp != t->ifs || t->ifs[1].nd)) {
530 ejectif(t, ifp);
531 ifp = NULL;
532 }
533
534 if (ata_scnt(skb_mac_header(f->skb)) > DEFAULTBCNT / 512
535 && ifp && ++ifp->lostjumbo > (t->nframes << 1)
536 && ifp->maxbcnt != DEFAULTBCNT) {
537 printk(KERN_INFO
538 "aoe: e%ld.%d: "
539 "too many lost jumbo on "
411c41ee 540 "%s:%pm - "
68e0d42f
EC
541 "falling back to %d frames.\n",
542 d->aoemajor, d->aoeminor,
411c41ee 543 ifp->nd->name, t->addr,
68e0d42f
EC
544 DEFAULTBCNT);
545 ifp->maxbcnt = 0;
546 }
547 resend(d, t, f);
548 }
549
550 /* window check */
551 if (t->nout == t->maxout
552 && t->maxout < t->nframes
553 && (jiffies - t->lastwadj)/HZ > 10) {
554 t->maxout++;
555 t->lastwadj = jiffies;
1da177e4
LT
556 }
557 }
68e0d42f 558
e9bb8fb0 559 if (!skb_queue_empty(&d->sendq)) {
68e0d42f
EC
560 n = d->rttavg <<= 1;
561 if (n > MAXTIMER)
562 d->rttavg = MAXTIMER;
563 }
564
565 if (d->flags & DEVFL_KICKME || d->htgt) {
4f51dc5e
EC
566 d->flags &= ~DEVFL_KICKME;
567 aoecmd_work(d);
568 }
1da177e4 569
e9bb8fb0
DM
570 __skb_queue_head_init(&queue);
571 skb_queue_splice_init(&d->sendq, &queue);
1da177e4
LT
572
573 d->timer.expires = jiffies + TIMERTICK;
574 add_timer(&d->timer);
575
576 spin_unlock_irqrestore(&d->lock, flags);
577
e9bb8fb0 578 aoenet_xmit(&queue);
1da177e4
LT
579}
580
68e0d42f
EC
581/* enters with d->lock held */
582void
583aoecmd_work(struct aoedev *d)
584{
585 struct buf *buf;
586loop:
587 if (d->htgt && !sthtith(d))
588 return;
589 if (d->inprocess == NULL) {
590 if (list_empty(&d->bufq))
591 return;
592 buf = container_of(d->bufq.next, struct buf, bufs);
593 list_del(d->bufq.next);
594 d->inprocess = buf;
595 }
596 if (aoecmd_ata_rw(d))
597 goto loop;
598}
599
3ae1c24e
EC
600/* this function performs work that has been deferred until sleeping is OK
601 */
602void
c4028958 603aoecmd_sleepwork(struct work_struct *work)
3ae1c24e 604{
c4028958 605 struct aoedev *d = container_of(work, struct aoedev, work);
3ae1c24e
EC
606
607 if (d->flags & DEVFL_GDALLOC)
608 aoeblk_gdalloc(d);
609
610 if (d->flags & DEVFL_NEWSIZE) {
611 struct block_device *bd;
612 unsigned long flags;
613 u64 ssize;
614
80795aef 615 ssize = get_capacity(d->gd);
3ae1c24e
EC
616 bd = bdget_disk(d->gd, 0);
617
618 if (bd) {
619 mutex_lock(&bd->bd_inode->i_mutex);
620 i_size_write(bd->bd_inode, (loff_t)ssize<<9);
621 mutex_unlock(&bd->bd_inode->i_mutex);
622 bdput(bd);
623 }
624 spin_lock_irqsave(&d->lock, flags);
625 d->flags |= DEVFL_UP;
626 d->flags &= ~DEVFL_NEWSIZE;
627 spin_unlock_irqrestore(&d->lock, flags);
628 }
629}
630
1da177e4 631static void
68e0d42f 632ataid_complete(struct aoedev *d, struct aoetgt *t, unsigned char *id)
1da177e4
LT
633{
634 u64 ssize;
635 u16 n;
636
637 /* word 83: command set supported */
f885f8d1 638 n = get_unaligned_le16(&id[83 << 1]);
1da177e4
LT
639
640 /* word 86: command set/feature enabled */
f885f8d1 641 n |= get_unaligned_le16(&id[86 << 1]);
1da177e4
LT
642
643 if (n & (1<<10)) { /* bit 10: LBA 48 */
644 d->flags |= DEVFL_EXT;
645
646 /* word 100: number lba48 sectors */
f885f8d1 647 ssize = get_unaligned_le64(&id[100 << 1]);
1da177e4
LT
648
649 /* set as in ide-disk.c:init_idedisk_capacity */
650 d->geo.cylinders = ssize;
651 d->geo.cylinders /= (255 * 63);
652 d->geo.heads = 255;
653 d->geo.sectors = 63;
654 } else {
655 d->flags &= ~DEVFL_EXT;
656
657 /* number lba28 sectors */
f885f8d1 658 ssize = get_unaligned_le32(&id[60 << 1]);
1da177e4
LT
659
660 /* NOTE: obsolete in ATA 6 */
f885f8d1
HH
661 d->geo.cylinders = get_unaligned_le16(&id[54 << 1]);
662 d->geo.heads = get_unaligned_le16(&id[55 << 1]);
663 d->geo.sectors = get_unaligned_le16(&id[56 << 1]);
1da177e4 664 }
3ae1c24e
EC
665
666 if (d->ssize != ssize)
1d75981a 667 printk(KERN_INFO
411c41ee
HH
668 "aoe: %pm e%ld.%d v%04x has %llu sectors\n",
669 t->addr,
3ae1c24e
EC
670 d->aoemajor, d->aoeminor,
671 d->fw_ver, (long long)ssize);
1da177e4
LT
672 d->ssize = ssize;
673 d->geo.start = 0;
6b9699bb
EC
674 if (d->flags & (DEVFL_GDALLOC|DEVFL_NEWSIZE))
675 return;
1da177e4 676 if (d->gd != NULL) {
80795aef 677 set_capacity(d->gd, ssize);
3ae1c24e 678 d->flags |= DEVFL_NEWSIZE;
68e0d42f 679 } else
3ae1c24e 680 d->flags |= DEVFL_GDALLOC;
1da177e4 681 schedule_work(&d->work);
1da177e4
LT
682}
683
684static void
685calc_rttavg(struct aoedev *d, int rtt)
686{
687 register long n;
688
689 n = rtt;
dced3a05
EC
690 if (n < 0) {
691 n = -rtt;
692 if (n < MINTIMER)
693 n = MINTIMER;
694 else if (n > MAXTIMER)
695 n = MAXTIMER;
696 d->mintimer += (n - d->mintimer) >> 1;
697 } else if (n < d->mintimer)
698 n = d->mintimer;
1da177e4
LT
699 else if (n > MAXTIMER)
700 n = MAXTIMER;
701
702 /* g == .25; cf. Congestion Avoidance and Control, Jacobson & Karels; 1988 */
703 n -= d->rttavg;
704 d->rttavg += n >> 2;
705}
706
68e0d42f
EC
707static struct aoetgt *
708gettgt(struct aoedev *d, char *addr)
709{
710 struct aoetgt **t, **e;
711
712 t = d->targets;
713 e = t + NTARGETS;
714 for (; t < e && *t; t++)
715 if (memcmp((*t)->addr, addr, sizeof((*t)->addr)) == 0)
716 return *t;
717 return NULL;
718}
719
720static inline void
03054de1 721diskstats(struct gendisk *disk, struct bio *bio, ulong duration, sector_t sector)
68e0d42f
EC
722{
723 unsigned long n_sect = bio->bi_size >> 9;
724 const int rw = bio_data_dir(bio);
28f13702 725 struct hd_struct *part;
c9959059 726 int cpu;
68e0d42f 727
074a7aca 728 cpu = part_stat_lock();
e71bf0d0 729 part = disk_map_sector_rcu(disk, sector);
e71bf0d0 730
074a7aca
TH
731 part_stat_inc(cpu, part, ios[rw]);
732 part_stat_add(cpu, part, ticks[rw], duration);
733 part_stat_add(cpu, part, sectors[rw], n_sect);
734 part_stat_add(cpu, part, io_ticks, duration);
c9959059 735
074a7aca 736 part_stat_unlock();
68e0d42f
EC
737}
738
1da177e4
LT
739void
740aoecmd_ata_rsp(struct sk_buff *skb)
741{
e9bb8fb0 742 struct sk_buff_head queue;
1da177e4 743 struct aoedev *d;
ddec63e8 744 struct aoe_hdr *hin, *hout;
1da177e4
LT
745 struct aoe_atahdr *ahin, *ahout;
746 struct frame *f;
747 struct buf *buf;
68e0d42f
EC
748 struct aoetgt *t;
749 struct aoeif *ifp;
1da177e4
LT
750 register long n;
751 ulong flags;
752 char ebuf[128];
32465c65
EC
753 u16 aoemajor;
754
abdbf94d 755 hin = (struct aoe_hdr *) skb_mac_header(skb);
f885f8d1 756 aoemajor = get_unaligned_be16(&hin->major);
32465c65 757 d = aoedev_by_aoeaddr(aoemajor, hin->minor);
1da177e4
LT
758 if (d == NULL) {
759 snprintf(ebuf, sizeof ebuf, "aoecmd_ata_rsp: ata response "
760 "for unknown device %d.%d\n",
32465c65 761 aoemajor, hin->minor);
1da177e4
LT
762 aoechr_error(ebuf);
763 return;
764 }
765
766 spin_lock_irqsave(&d->lock, flags);
767
f885f8d1 768 n = get_unaligned_be32(&hin->tag);
68e0d42f
EC
769 t = gettgt(d, hin->src);
770 if (t == NULL) {
411c41ee
HH
771 printk(KERN_INFO "aoe: can't find target e%ld.%d:%pm\n",
772 d->aoemajor, d->aoeminor, hin->src);
68e0d42f
EC
773 spin_unlock_irqrestore(&d->lock, flags);
774 return;
775 }
776 f = getframe(t, n);
1da177e4 777 if (f == NULL) {
dced3a05 778 calc_rttavg(d, -tsince(n));
1da177e4
LT
779 spin_unlock_irqrestore(&d->lock, flags);
780 snprintf(ebuf, sizeof ebuf,
781 "%15s e%d.%d tag=%08x@%08lx\n",
782 "unexpected rsp",
f885f8d1 783 get_unaligned_be16(&hin->major),
1da177e4 784 hin->minor,
f885f8d1 785 get_unaligned_be32(&hin->tag),
1da177e4
LT
786 jiffies);
787 aoechr_error(ebuf);
788 return;
789 }
790
791 calc_rttavg(d, tsince(f->tag));
792
793 ahin = (struct aoe_atahdr *) (hin+1);
abdbf94d 794 hout = (struct aoe_hdr *) skb_mac_header(f->skb);
ddec63e8 795 ahout = (struct aoe_atahdr *) (hout+1);
1da177e4
LT
796 buf = f->buf;
797
798 if (ahin->cmdstat & 0xa9) { /* these bits cleared on success */
a12c93f0 799 printk(KERN_ERR
1d75981a 800 "aoe: ata error cmd=%2.2Xh stat=%2.2Xh from e%ld.%d\n",
1da177e4
LT
801 ahout->cmdstat, ahin->cmdstat,
802 d->aoemajor, d->aoeminor);
803 if (buf)
804 buf->flags |= BUFFL_FAIL;
805 } else {
68e0d42f
EC
806 if (d->htgt && t == *d->htgt) /* I'll help myself, thank you. */
807 d->htgt = NULL;
19bf2635 808 n = ahout->scnt << 9;
1da177e4 809 switch (ahout->cmdstat) {
04b3ab52
BZ
810 case ATA_CMD_PIO_READ:
811 case ATA_CMD_PIO_READ_EXT:
1da177e4 812 if (skb->len - sizeof *hin - sizeof *ahin < n) {
a12c93f0 813 printk(KERN_ERR
68e0d42f
EC
814 "aoe: %s. skb->len=%d need=%ld\n",
815 "runt data size in read", skb->len, n);
1da177e4
LT
816 /* fail frame f? just returning will rexmit. */
817 spin_unlock_irqrestore(&d->lock, flags);
818 return;
819 }
820 memcpy(f->bufaddr, ahin+1, n);
04b3ab52
BZ
821 case ATA_CMD_PIO_WRITE:
822 case ATA_CMD_PIO_WRITE_EXT:
68e0d42f
EC
823 ifp = getif(t, skb->dev);
824 if (ifp) {
825 ifp->lost = 0;
826 if (n > DEFAULTBCNT)
827 ifp->lostjumbo = 0;
828 }
19bf2635 829 if (f->bcnt -= n) {
68e0d42f 830 f->lba += n >> 9;
19bf2635 831 f->bufaddr += n;
68e0d42f
EC
832 resend(d, t, f);
833 goto xmit;
19bf2635 834 }
1da177e4 835 break;
04b3ab52 836 case ATA_CMD_ID_ATA:
1da177e4 837 if (skb->len - sizeof *hin - sizeof *ahin < 512) {
a12c93f0
EC
838 printk(KERN_INFO
839 "aoe: runt data size in ataid. skb->len=%d\n",
6bb6285f 840 skb->len);
1da177e4
LT
841 spin_unlock_irqrestore(&d->lock, flags);
842 return;
843 }
68e0d42f 844 ataid_complete(d, t, (char *) (ahin+1));
1da177e4
LT
845 break;
846 default:
a12c93f0
EC
847 printk(KERN_INFO
848 "aoe: unrecognized ata command %2.2Xh for %d.%d\n",
6bb6285f 849 ahout->cmdstat,
f885f8d1 850 get_unaligned_be16(&hin->major),
6bb6285f 851 hin->minor);
1da177e4
LT
852 }
853 }
854
68e0d42f 855 if (buf && --buf->nframesout == 0 && buf->resid == 0) {
03054de1 856 diskstats(d->gd, buf->bio, jiffies - buf->stime, buf->sector);
0a1f127a
PH
857 if (buf->flags & BUFFL_FAIL)
858 bio_endio(buf->bio, -EIO);
859 else {
6ec1480d 860 bio_flush_dcache_pages(buf->bio);
0a1f127a
PH
861 bio_endio(buf->bio, 0);
862 }
68e0d42f 863 mempool_free(buf, d->bufpool);
1da177e4
LT
864 }
865
866 f->buf = NULL;
867 f->tag = FREETAG;
68e0d42f 868 t->nout--;
1da177e4
LT
869
870 aoecmd_work(d);
68e0d42f 871xmit:
e9bb8fb0
DM
872 __skb_queue_head_init(&queue);
873 skb_queue_splice_init(&d->sendq, &queue);
1da177e4
LT
874
875 spin_unlock_irqrestore(&d->lock, flags);
e9bb8fb0 876 aoenet_xmit(&queue);
1da177e4
LT
877}
878
879void
880aoecmd_cfg(ushort aoemajor, unsigned char aoeminor)
881{
e9bb8fb0 882 struct sk_buff_head queue;
1da177e4 883
e9bb8fb0
DM
884 __skb_queue_head_init(&queue);
885 aoecmd_cfg_pkts(aoemajor, aoeminor, &queue);
886 aoenet_xmit(&queue);
1da177e4
LT
887}
888
68e0d42f 889struct sk_buff *
1da177e4
LT
890aoecmd_ata_id(struct aoedev *d)
891{
892 struct aoe_hdr *h;
893 struct aoe_atahdr *ah;
894 struct frame *f;
895 struct sk_buff *skb;
68e0d42f 896 struct aoetgt *t;
1da177e4 897
4f51dc5e 898 f = freeframe(d);
68e0d42f 899 if (f == NULL)
1da177e4 900 return NULL;
68e0d42f
EC
901
902 t = *d->tgt;
1da177e4
LT
903
904 /* initialize the headers & frame */
e407a7f6 905 skb = f->skb;
abdbf94d 906 h = (struct aoe_hdr *) skb_mac_header(skb);
1da177e4 907 ah = (struct aoe_atahdr *) (h+1);
19900cde
EC
908 skb_put(skb, sizeof *h + sizeof *ah);
909 memset(h, 0, skb->len);
68e0d42f
EC
910 f->tag = aoehdr_atainit(d, t, h);
911 t->nout++;
1da177e4 912 f->waited = 0;
1da177e4 913
1da177e4
LT
914 /* set up ata header */
915 ah->scnt = 1;
04b3ab52 916 ah->cmdstat = ATA_CMD_ID_ATA;
1da177e4
LT
917 ah->lba3 = 0xa0;
918
68e0d42f 919 skb->dev = t->ifp->nd;
1da177e4 920
3ae1c24e 921 d->rttavg = MAXTIMER;
1da177e4 922 d->timer.function = rexmit_timer;
1da177e4 923
4f51dc5e 924 return skb_clone(skb, GFP_ATOMIC);
1da177e4
LT
925}
926
68e0d42f
EC
927static struct aoetgt *
928addtgt(struct aoedev *d, char *addr, ulong nframes)
929{
930 struct aoetgt *t, **tt, **te;
931 struct frame *f, *e;
932
933 tt = d->targets;
934 te = tt + NTARGETS;
935 for (; tt < te && *tt; tt++)
936 ;
937
578c4aa0
EC
938 if (tt == te) {
939 printk(KERN_INFO
940 "aoe: device addtgt failure; too many targets\n");
68e0d42f 941 return NULL;
578c4aa0 942 }
68e0d42f
EC
943 t = kcalloc(1, sizeof *t, GFP_ATOMIC);
944 f = kcalloc(nframes, sizeof *f, GFP_ATOMIC);
578c4aa0
EC
945 if (!t || !f) {
946 kfree(f);
9bb237b6 947 kfree(t);
578c4aa0 948 printk(KERN_INFO "aoe: cannot allocate memory to add target\n");
9bb237b6
EC
949 return NULL;
950 }
951
68e0d42f
EC
952 t->nframes = nframes;
953 t->frames = f;
954 e = f + nframes;
9bb237b6 955 for (; f < e; f++)
68e0d42f 956 f->tag = FREETAG;
68e0d42f
EC
957 memcpy(t->addr, addr, sizeof t->addr);
958 t->ifp = t->ifs;
959 t->maxout = t->nframes;
960 return *tt = t;
68e0d42f
EC
961}
962
1da177e4
LT
963void
964aoecmd_cfg_rsp(struct sk_buff *skb)
965{
966 struct aoedev *d;
967 struct aoe_hdr *h;
968 struct aoe_cfghdr *ch;
68e0d42f
EC
969 struct aoetgt *t;
970 struct aoeif *ifp;
63e9cc5d 971 ulong flags, sysminor, aoemajor;
1da177e4 972 struct sk_buff *sl;
19bf2635 973 u16 n;
1da177e4 974
abdbf94d 975 h = (struct aoe_hdr *) skb_mac_header(skb);
1da177e4
LT
976 ch = (struct aoe_cfghdr *) (h+1);
977
978 /*
979 * Enough people have their dip switches set backwards to
980 * warrant a loud message for this special case.
981 */
823ed72e 982 aoemajor = get_unaligned_be16(&h->major);
1da177e4 983 if (aoemajor == 0xfff) {
a12c93f0 984 printk(KERN_ERR "aoe: Warning: shelf address is all ones. "
6bb6285f 985 "Check shelf dip switches.\n");
1da177e4
LT
986 return;
987 }
988
989 sysminor = SYSMINOR(aoemajor, h->minor);
fc458dcd 990 if (sysminor * AOE_PARTITIONS + AOE_PARTITIONS > MINORMASK) {
a12c93f0 991 printk(KERN_INFO "aoe: e%ld.%d: minor number too large\n",
fc458dcd 992 aoemajor, (int) h->minor);
1da177e4
LT
993 return;
994 }
995
19bf2635 996 n = be16_to_cpu(ch->bufcnt);
7df620d8
EC
997 if (n > aoe_maxout) /* keep it reasonable */
998 n = aoe_maxout;
1da177e4 999
68e0d42f 1000 d = aoedev_by_sysminor_m(sysminor);
1da177e4 1001 if (d == NULL) {
a12c93f0 1002 printk(KERN_INFO "aoe: device sysminor_m failure\n");
1da177e4
LT
1003 return;
1004 }
1005
1006 spin_lock_irqsave(&d->lock, flags);
1007
68e0d42f
EC
1008 t = gettgt(d, h->src);
1009 if (!t) {
1010 t = addtgt(d, h->src, n);
1011 if (!t) {
68e0d42f
EC
1012 spin_unlock_irqrestore(&d->lock, flags);
1013 return;
1014 }
1015 }
1016 ifp = getif(t, skb->dev);
1017 if (!ifp) {
1018 ifp = addif(t, skb->dev);
1019 if (!ifp) {
1020 printk(KERN_INFO
1021 "aoe: device addif failure; "
1022 "too many interfaces?\n");
1023 spin_unlock_irqrestore(&d->lock, flags);
1024 return;
1025 }
1026 }
1027 if (ifp->maxbcnt) {
1028 n = ifp->nd->mtu;
19bf2635
EC
1029 n -= sizeof (struct aoe_hdr) + sizeof (struct aoe_atahdr);
1030 n /= 512;
1031 if (n > ch->scnt)
1032 n = ch->scnt;
4f51dc5e 1033 n = n ? n * 512 : DEFAULTBCNT;
68e0d42f 1034 if (n != ifp->maxbcnt) {
a12c93f0 1035 printk(KERN_INFO
411c41ee 1036 "aoe: e%ld.%d: setting %d%s%s:%pm\n",
68e0d42f
EC
1037 d->aoemajor, d->aoeminor, n,
1038 " byte data frames on ", ifp->nd->name,
411c41ee 1039 t->addr);
68e0d42f 1040 ifp->maxbcnt = n;
4f51dc5e 1041 }
19bf2635 1042 }
3ae1c24e
EC
1043
1044 /* don't change users' perspective */
68e0d42f 1045 if (d->nopen) {
1da177e4
LT
1046 spin_unlock_irqrestore(&d->lock, flags);
1047 return;
1048 }
63e9cc5d 1049 d->fw_ver = be16_to_cpu(ch->fwver);
1da177e4 1050
68e0d42f 1051 sl = aoecmd_ata_id(d);
1da177e4
LT
1052
1053 spin_unlock_irqrestore(&d->lock, flags);
1054
e9bb8fb0
DM
1055 if (sl) {
1056 struct sk_buff_head queue;
1057 __skb_queue_head_init(&queue);
1058 __skb_queue_tail(&queue, sl);
1059 aoenet_xmit(&queue);
1060 }
1da177e4
LT
1061}
1062
68e0d42f
EC
1063void
1064aoecmd_cleanslate(struct aoedev *d)
1065{
1066 struct aoetgt **t, **te;
1067 struct aoeif *p, *e;
1068
1069 d->mintimer = MINTIMER;
1070
1071 t = d->targets;
1072 te = t + NTARGETS;
1073 for (; t < te && *t; t++) {
1074 (*t)->maxout = (*t)->nframes;
1075 p = (*t)->ifs;
1076 e = p + NAOEIFS;
1077 for (; p < e; p++) {
1078 p->lostjumbo = 0;
1079 p->lost = 0;
1080 p->maxbcnt = DEFAULTBCNT;
1081 }
1082 }
1083}