Merge branch 'perf-fixes-for-linus' of git://git.kernel.org/pub/scm/linux/kernel...
[pandora-kernel.git] / drivers / usb / host / ehci-sched.c
1 /*
2  * Copyright (c) 2001-2004 by David Brownell
3  * Copyright (c) 2003 Michal Sojka, for high-speed iso transfers
4  *
5  * This program is free software; you can redistribute it and/or modify it
6  * under the terms of the GNU General Public License as published by the
7  * Free Software Foundation; either version 2 of the License, or (at your
8  * option) any later version.
9  *
10  * This program is distributed in the hope that it will be useful, but
11  * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
12  * or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
13  * for more details.
14  *
15  * You should have received a copy of the GNU General Public License
16  * along with this program; if not, write to the Free Software Foundation,
17  * Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
18  */
19
20 /* this file is part of ehci-hcd.c */
21
22 /*-------------------------------------------------------------------------*/
23
24 /*
25  * EHCI scheduled transaction support:  interrupt, iso, split iso
26  * These are called "periodic" transactions in the EHCI spec.
27  *
28  * Note that for interrupt transfers, the QH/QTD manipulation is shared
29  * with the "asynchronous" transaction support (control/bulk transfers).
30  * The only real difference is in how interrupt transfers are scheduled.
31  *
32  * For ISO, we make an "iso_stream" head to serve the same role as a QH.
33  * It keeps track of every ITD (or SITD) that's linked, and holds enough
34  * pre-calculated schedule data to make appending to the queue be quick.
35  */
36
37 static int ehci_get_frame (struct usb_hcd *hcd);
38
39 /*-------------------------------------------------------------------------*/
40
41 /*
42  * periodic_next_shadow - return "next" pointer on shadow list
43  * @periodic: host pointer to qh/itd/sitd
44  * @tag: hardware tag for type of this record
45  */
46 static union ehci_shadow *
47 periodic_next_shadow(struct ehci_hcd *ehci, union ehci_shadow *periodic,
48                 __hc32 tag)
49 {
50         switch (hc32_to_cpu(ehci, tag)) {
51         case Q_TYPE_QH:
52                 return &periodic->qh->qh_next;
53         case Q_TYPE_FSTN:
54                 return &periodic->fstn->fstn_next;
55         case Q_TYPE_ITD:
56                 return &periodic->itd->itd_next;
57         // case Q_TYPE_SITD:
58         default:
59                 return &periodic->sitd->sitd_next;
60         }
61 }
62
63 static __hc32 *
64 shadow_next_periodic(struct ehci_hcd *ehci, union ehci_shadow *periodic,
65                 __hc32 tag)
66 {
67         switch (hc32_to_cpu(ehci, tag)) {
68         /* our ehci_shadow.qh is actually software part */
69         case Q_TYPE_QH:
70                 return &periodic->qh->hw->hw_next;
71         /* others are hw parts */
72         default:
73                 return periodic->hw_next;
74         }
75 }
76
77 /* caller must hold ehci->lock */
78 static void periodic_unlink (struct ehci_hcd *ehci, unsigned frame, void *ptr)
79 {
80         union ehci_shadow       *prev_p = &ehci->pshadow[frame];
81         __hc32                  *hw_p = &ehci->periodic[frame];
82         union ehci_shadow       here = *prev_p;
83
84         /* find predecessor of "ptr"; hw and shadow lists are in sync */
85         while (here.ptr && here.ptr != ptr) {
86                 prev_p = periodic_next_shadow(ehci, prev_p,
87                                 Q_NEXT_TYPE(ehci, *hw_p));
88                 hw_p = shadow_next_periodic(ehci, &here,
89                                 Q_NEXT_TYPE(ehci, *hw_p));
90                 here = *prev_p;
91         }
92         /* an interrupt entry (at list end) could have been shared */
93         if (!here.ptr)
94                 return;
95
96         /* update shadow and hardware lists ... the old "next" pointers
97          * from ptr may still be in use, the caller updates them.
98          */
99         *prev_p = *periodic_next_shadow(ehci, &here,
100                         Q_NEXT_TYPE(ehci, *hw_p));
101         *hw_p = *shadow_next_periodic(ehci, &here, Q_NEXT_TYPE(ehci, *hw_p));
102 }
103
104 /* how many of the uframe's 125 usecs are allocated? */
105 static unsigned short
106 periodic_usecs (struct ehci_hcd *ehci, unsigned frame, unsigned uframe)
107 {
108         __hc32                  *hw_p = &ehci->periodic [frame];
109         union ehci_shadow       *q = &ehci->pshadow [frame];
110         unsigned                usecs = 0;
111         struct ehci_qh_hw       *hw;
112
113         while (q->ptr) {
114                 switch (hc32_to_cpu(ehci, Q_NEXT_TYPE(ehci, *hw_p))) {
115                 case Q_TYPE_QH:
116                         hw = q->qh->hw;
117                         /* is it in the S-mask? */
118                         if (hw->hw_info2 & cpu_to_hc32(ehci, 1 << uframe))
119                                 usecs += q->qh->usecs;
120                         /* ... or C-mask? */
121                         if (hw->hw_info2 & cpu_to_hc32(ehci,
122                                         1 << (8 + uframe)))
123                                 usecs += q->qh->c_usecs;
124                         hw_p = &hw->hw_next;
125                         q = &q->qh->qh_next;
126                         break;
127                 // case Q_TYPE_FSTN:
128                 default:
129                         /* for "save place" FSTNs, count the relevant INTR
130                          * bandwidth from the previous frame
131                          */
132                         if (q->fstn->hw_prev != EHCI_LIST_END(ehci)) {
133                                 ehci_dbg (ehci, "ignoring FSTN cost ...\n");
134                         }
135                         hw_p = &q->fstn->hw_next;
136                         q = &q->fstn->fstn_next;
137                         break;
138                 case Q_TYPE_ITD:
139                         if (q->itd->hw_transaction[uframe])
140                                 usecs += q->itd->stream->usecs;
141                         hw_p = &q->itd->hw_next;
142                         q = &q->itd->itd_next;
143                         break;
144                 case Q_TYPE_SITD:
145                         /* is it in the S-mask?  (count SPLIT, DATA) */
146                         if (q->sitd->hw_uframe & cpu_to_hc32(ehci,
147                                         1 << uframe)) {
148                                 if (q->sitd->hw_fullspeed_ep &
149                                                 cpu_to_hc32(ehci, 1<<31))
150                                         usecs += q->sitd->stream->usecs;
151                                 else    /* worst case for OUT start-split */
152                                         usecs += HS_USECS_ISO (188);
153                         }
154
155                         /* ... C-mask?  (count CSPLIT, DATA) */
156                         if (q->sitd->hw_uframe &
157                                         cpu_to_hc32(ehci, 1 << (8 + uframe))) {
158                                 /* worst case for IN complete-split */
159                                 usecs += q->sitd->stream->c_usecs;
160                         }
161
162                         hw_p = &q->sitd->hw_next;
163                         q = &q->sitd->sitd_next;
164                         break;
165                 }
166         }
167 #ifdef  DEBUG
168         if (usecs > 100)
169                 ehci_err (ehci, "uframe %d sched overrun: %d usecs\n",
170                         frame * 8 + uframe, usecs);
171 #endif
172         return usecs;
173 }
174
175 /*-------------------------------------------------------------------------*/
176
177 static int same_tt (struct usb_device *dev1, struct usb_device *dev2)
178 {
179         if (!dev1->tt || !dev2->tt)
180                 return 0;
181         if (dev1->tt != dev2->tt)
182                 return 0;
183         if (dev1->tt->multi)
184                 return dev1->ttport == dev2->ttport;
185         else
186                 return 1;
187 }
188
189 #ifdef CONFIG_USB_EHCI_TT_NEWSCHED
190
191 /* Which uframe does the low/fullspeed transfer start in?
192  *
193  * The parameter is the mask of ssplits in "H-frame" terms
194  * and this returns the transfer start uframe in "B-frame" terms,
195  * which allows both to match, e.g. a ssplit in "H-frame" uframe 0
196  * will cause a transfer in "B-frame" uframe 0.  "B-frames" lag
197  * "H-frames" by 1 uframe.  See the EHCI spec sec 4.5 and figure 4.7.
198  */
199 static inline unsigned char tt_start_uframe(struct ehci_hcd *ehci, __hc32 mask)
200 {
201         unsigned char smask = QH_SMASK & hc32_to_cpu(ehci, mask);
202         if (!smask) {
203                 ehci_err(ehci, "invalid empty smask!\n");
204                 /* uframe 7 can't have bw so this will indicate failure */
205                 return 7;
206         }
207         return ffs(smask) - 1;
208 }
209
210 static const unsigned char
211 max_tt_usecs[] = { 125, 125, 125, 125, 125, 125, 30, 0 };
212
213 /* carryover low/fullspeed bandwidth that crosses uframe boundries */
214 static inline void carryover_tt_bandwidth(unsigned short tt_usecs[8])
215 {
216         int i;
217         for (i=0; i<7; i++) {
218                 if (max_tt_usecs[i] < tt_usecs[i]) {
219                         tt_usecs[i+1] += tt_usecs[i] - max_tt_usecs[i];
220                         tt_usecs[i] = max_tt_usecs[i];
221                 }
222         }
223 }
224
225 /* How many of the tt's periodic downstream 1000 usecs are allocated?
226  *
227  * While this measures the bandwidth in terms of usecs/uframe,
228  * the low/fullspeed bus has no notion of uframes, so any particular
229  * low/fullspeed transfer can "carry over" from one uframe to the next,
230  * since the TT just performs downstream transfers in sequence.
231  *
232  * For example two separate 100 usec transfers can start in the same uframe,
233  * and the second one would "carry over" 75 usecs into the next uframe.
234  */
235 static void
236 periodic_tt_usecs (
237         struct ehci_hcd *ehci,
238         struct usb_device *dev,
239         unsigned frame,
240         unsigned short tt_usecs[8]
241 )
242 {
243         __hc32                  *hw_p = &ehci->periodic [frame];
244         union ehci_shadow       *q = &ehci->pshadow [frame];
245         unsigned char           uf;
246
247         memset(tt_usecs, 0, 16);
248
249         while (q->ptr) {
250                 switch (hc32_to_cpu(ehci, Q_NEXT_TYPE(ehci, *hw_p))) {
251                 case Q_TYPE_ITD:
252                         hw_p = &q->itd->hw_next;
253                         q = &q->itd->itd_next;
254                         continue;
255                 case Q_TYPE_QH:
256                         if (same_tt(dev, q->qh->dev)) {
257                                 uf = tt_start_uframe(ehci, q->qh->hw->hw_info2);
258                                 tt_usecs[uf] += q->qh->tt_usecs;
259                         }
260                         hw_p = &q->qh->hw->hw_next;
261                         q = &q->qh->qh_next;
262                         continue;
263                 case Q_TYPE_SITD:
264                         if (same_tt(dev, q->sitd->urb->dev)) {
265                                 uf = tt_start_uframe(ehci, q->sitd->hw_uframe);
266                                 tt_usecs[uf] += q->sitd->stream->tt_usecs;
267                         }
268                         hw_p = &q->sitd->hw_next;
269                         q = &q->sitd->sitd_next;
270                         continue;
271                 // case Q_TYPE_FSTN:
272                 default:
273                         ehci_dbg(ehci, "ignoring periodic frame %d FSTN\n",
274                                         frame);
275                         hw_p = &q->fstn->hw_next;
276                         q = &q->fstn->fstn_next;
277                 }
278         }
279
280         carryover_tt_bandwidth(tt_usecs);
281
282         if (max_tt_usecs[7] < tt_usecs[7])
283                 ehci_err(ehci, "frame %d tt sched overrun: %d usecs\n",
284                         frame, tt_usecs[7] - max_tt_usecs[7]);
285 }
286
287 /*
288  * Return true if the device's tt's downstream bus is available for a
289  * periodic transfer of the specified length (usecs), starting at the
290  * specified frame/uframe.  Note that (as summarized in section 11.19
291  * of the usb 2.0 spec) TTs can buffer multiple transactions for each
292  * uframe.
293  *
294  * The uframe parameter is when the fullspeed/lowspeed transfer
295  * should be executed in "B-frame" terms, which is the same as the
296  * highspeed ssplit's uframe (which is in "H-frame" terms).  For example
297  * a ssplit in "H-frame" 0 causes a transfer in "B-frame" 0.
298  * See the EHCI spec sec 4.5 and fig 4.7.
299  *
300  * This checks if the full/lowspeed bus, at the specified starting uframe,
301  * has the specified bandwidth available, according to rules listed
302  * in USB 2.0 spec section 11.18.1 fig 11-60.
303  *
304  * This does not check if the transfer would exceed the max ssplit
305  * limit of 16, specified in USB 2.0 spec section 11.18.4 requirement #4,
306  * since proper scheduling limits ssplits to less than 16 per uframe.
307  */
308 static int tt_available (
309         struct ehci_hcd         *ehci,
310         unsigned                period,
311         struct usb_device       *dev,
312         unsigned                frame,
313         unsigned                uframe,
314         u16                     usecs
315 )
316 {
317         if ((period == 0) || (uframe >= 7))     /* error */
318                 return 0;
319
320         for (; frame < ehci->periodic_size; frame += period) {
321                 unsigned short tt_usecs[8];
322
323                 periodic_tt_usecs (ehci, dev, frame, tt_usecs);
324
325                 ehci_vdbg(ehci, "tt frame %d check %d usecs start uframe %d in"
326                         " schedule %d/%d/%d/%d/%d/%d/%d/%d\n",
327                         frame, usecs, uframe,
328                         tt_usecs[0], tt_usecs[1], tt_usecs[2], tt_usecs[3],
329                         tt_usecs[4], tt_usecs[5], tt_usecs[6], tt_usecs[7]);
330
331                 if (max_tt_usecs[uframe] <= tt_usecs[uframe]) {
332                         ehci_vdbg(ehci, "frame %d uframe %d fully scheduled\n",
333                                 frame, uframe);
334                         return 0;
335                 }
336
337                 /* special case for isoc transfers larger than 125us:
338                  * the first and each subsequent fully used uframe
339                  * must be empty, so as to not illegally delay
340                  * already scheduled transactions
341                  */
342                 if (125 < usecs) {
343                         int ufs = (usecs / 125);
344                         int i;
345                         for (i = uframe; i < (uframe + ufs) && i < 8; i++)
346                                 if (0 < tt_usecs[i]) {
347                                         ehci_vdbg(ehci,
348                                                 "multi-uframe xfer can't fit "
349                                                 "in frame %d uframe %d\n",
350                                                 frame, i);
351                                         return 0;
352                                 }
353                 }
354
355                 tt_usecs[uframe] += usecs;
356
357                 carryover_tt_bandwidth(tt_usecs);
358
359                 /* fail if the carryover pushed bw past the last uframe's limit */
360                 if (max_tt_usecs[7] < tt_usecs[7]) {
361                         ehci_vdbg(ehci,
362                                 "tt unavailable usecs %d frame %d uframe %d\n",
363                                 usecs, frame, uframe);
364                         return 0;
365                 }
366         }
367
368         return 1;
369 }
370
371 #else
372
373 /* return true iff the device's transaction translator is available
374  * for a periodic transfer starting at the specified frame, using
375  * all the uframes in the mask.
376  */
377 static int tt_no_collision (
378         struct ehci_hcd         *ehci,
379         unsigned                period,
380         struct usb_device       *dev,
381         unsigned                frame,
382         u32                     uf_mask
383 )
384 {
385         if (period == 0)        /* error */
386                 return 0;
387
388         /* note bandwidth wastage:  split never follows csplit
389          * (different dev or endpoint) until the next uframe.
390          * calling convention doesn't make that distinction.
391          */
392         for (; frame < ehci->periodic_size; frame += period) {
393                 union ehci_shadow       here;
394                 __hc32                  type;
395                 struct ehci_qh_hw       *hw;
396
397                 here = ehci->pshadow [frame];
398                 type = Q_NEXT_TYPE(ehci, ehci->periodic [frame]);
399                 while (here.ptr) {
400                         switch (hc32_to_cpu(ehci, type)) {
401                         case Q_TYPE_ITD:
402                                 type = Q_NEXT_TYPE(ehci, here.itd->hw_next);
403                                 here = here.itd->itd_next;
404                                 continue;
405                         case Q_TYPE_QH:
406                                 hw = here.qh->hw;
407                                 if (same_tt (dev, here.qh->dev)) {
408                                         u32             mask;
409
410                                         mask = hc32_to_cpu(ehci,
411                                                         hw->hw_info2);
412                                         /* "knows" no gap is needed */
413                                         mask |= mask >> 8;
414                                         if (mask & uf_mask)
415                                                 break;
416                                 }
417                                 type = Q_NEXT_TYPE(ehci, hw->hw_next);
418                                 here = here.qh->qh_next;
419                                 continue;
420                         case Q_TYPE_SITD:
421                                 if (same_tt (dev, here.sitd->urb->dev)) {
422                                         u16             mask;
423
424                                         mask = hc32_to_cpu(ehci, here.sitd
425                                                                 ->hw_uframe);
426                                         /* FIXME assumes no gap for IN! */
427                                         mask |= mask >> 8;
428                                         if (mask & uf_mask)
429                                                 break;
430                                 }
431                                 type = Q_NEXT_TYPE(ehci, here.sitd->hw_next);
432                                 here = here.sitd->sitd_next;
433                                 continue;
434                         // case Q_TYPE_FSTN:
435                         default:
436                                 ehci_dbg (ehci,
437                                         "periodic frame %d bogus type %d\n",
438                                         frame, type);
439                         }
440
441                         /* collision or error */
442                         return 0;
443                 }
444         }
445
446         /* no collision */
447         return 1;
448 }
449
450 #endif /* CONFIG_USB_EHCI_TT_NEWSCHED */
451
452 /*-------------------------------------------------------------------------*/
453
454 static int enable_periodic (struct ehci_hcd *ehci)
455 {
456         u32     cmd;
457         int     status;
458
459         if (ehci->periodic_sched++)
460                 return 0;
461
462         /* did clearing PSE did take effect yet?
463          * takes effect only at frame boundaries...
464          */
465         status = handshake_on_error_set_halt(ehci, &ehci->regs->status,
466                                              STS_PSS, 0, 9 * 125);
467         if (status)
468                 return status;
469
470         cmd = ehci_readl(ehci, &ehci->regs->command) | CMD_PSE;
471         ehci_writel(ehci, cmd, &ehci->regs->command);
472         /* posted write ... PSS happens later */
473         ehci_to_hcd(ehci)->state = HC_STATE_RUNNING;
474
475         /* make sure ehci_work scans these */
476         ehci->next_uframe = ehci_readl(ehci, &ehci->regs->frame_index)
477                 % (ehci->periodic_size << 3);
478         if (unlikely(ehci->broken_periodic))
479                 ehci->last_periodic_enable = ktime_get_real();
480         return 0;
481 }
482
483 static int disable_periodic (struct ehci_hcd *ehci)
484 {
485         u32     cmd;
486         int     status;
487
488         if (--ehci->periodic_sched)
489                 return 0;
490
491         if (unlikely(ehci->broken_periodic)) {
492                 /* delay experimentally determined */
493                 ktime_t safe = ktime_add_us(ehci->last_periodic_enable, 1000);
494                 ktime_t now = ktime_get_real();
495                 s64 delay = ktime_us_delta(safe, now);
496
497                 if (unlikely(delay > 0))
498                         udelay(delay);
499         }
500
501         /* did setting PSE not take effect yet?
502          * takes effect only at frame boundaries...
503          */
504         status = handshake_on_error_set_halt(ehci, &ehci->regs->status,
505                                              STS_PSS, STS_PSS, 9 * 125);
506         if (status)
507                 return status;
508
509         cmd = ehci_readl(ehci, &ehci->regs->command) & ~CMD_PSE;
510         ehci_writel(ehci, cmd, &ehci->regs->command);
511         /* posted write ... */
512
513         free_cached_lists(ehci);
514
515         ehci->next_uframe = -1;
516         return 0;
517 }
518
519 /*-------------------------------------------------------------------------*/
520
521 /* periodic schedule slots have iso tds (normal or split) first, then a
522  * sparse tree for active interrupt transfers.
523  *
524  * this just links in a qh; caller guarantees uframe masks are set right.
525  * no FSTN support (yet; ehci 0.96+)
526  */
527 static int qh_link_periodic (struct ehci_hcd *ehci, struct ehci_qh *qh)
528 {
529         unsigned        i;
530         unsigned        period = qh->period;
531
532         dev_dbg (&qh->dev->dev,
533                 "link qh%d-%04x/%p start %d [%d/%d us]\n",
534                 period, hc32_to_cpup(ehci, &qh->hw->hw_info2)
535                         & (QH_CMASK | QH_SMASK),
536                 qh, qh->start, qh->usecs, qh->c_usecs);
537
538         /* high bandwidth, or otherwise every microframe */
539         if (period == 0)
540                 period = 1;
541
542         for (i = qh->start; i < ehci->periodic_size; i += period) {
543                 union ehci_shadow       *prev = &ehci->pshadow[i];
544                 __hc32                  *hw_p = &ehci->periodic[i];
545                 union ehci_shadow       here = *prev;
546                 __hc32                  type = 0;
547
548                 /* skip the iso nodes at list head */
549                 while (here.ptr) {
550                         type = Q_NEXT_TYPE(ehci, *hw_p);
551                         if (type == cpu_to_hc32(ehci, Q_TYPE_QH))
552                                 break;
553                         prev = periodic_next_shadow(ehci, prev, type);
554                         hw_p = shadow_next_periodic(ehci, &here, type);
555                         here = *prev;
556                 }
557
558                 /* sorting each branch by period (slow-->fast)
559                  * enables sharing interior tree nodes
560                  */
561                 while (here.ptr && qh != here.qh) {
562                         if (qh->period > here.qh->period)
563                                 break;
564                         prev = &here.qh->qh_next;
565                         hw_p = &here.qh->hw->hw_next;
566                         here = *prev;
567                 }
568                 /* link in this qh, unless some earlier pass did that */
569                 if (qh != here.qh) {
570                         qh->qh_next = here;
571                         if (here.qh)
572                                 qh->hw->hw_next = *hw_p;
573                         wmb ();
574                         prev->qh = qh;
575                         *hw_p = QH_NEXT (ehci, qh->qh_dma);
576                 }
577         }
578         qh->qh_state = QH_STATE_LINKED;
579         qh->xacterrs = 0;
580         qh_get (qh);
581
582         /* update per-qh bandwidth for usbfs */
583         ehci_to_hcd(ehci)->self.bandwidth_allocated += qh->period
584                 ? ((qh->usecs + qh->c_usecs) / qh->period)
585                 : (qh->usecs * 8);
586
587         /* maybe enable periodic schedule processing */
588         return enable_periodic(ehci);
589 }
590
591 static int qh_unlink_periodic(struct ehci_hcd *ehci, struct ehci_qh *qh)
592 {
593         unsigned        i;
594         unsigned        period;
595
596         // FIXME:
597         // IF this isn't high speed
598         //   and this qh is active in the current uframe
599         //   (and overlay token SplitXstate is false?)
600         // THEN
601         //   qh->hw_info1 |= cpu_to_hc32(1 << 7 /* "ignore" */);
602
603         /* high bandwidth, or otherwise part of every microframe */
604         if ((period = qh->period) == 0)
605                 period = 1;
606
607         for (i = qh->start; i < ehci->periodic_size; i += period)
608                 periodic_unlink (ehci, i, qh);
609
610         /* update per-qh bandwidth for usbfs */
611         ehci_to_hcd(ehci)->self.bandwidth_allocated -= qh->period
612                 ? ((qh->usecs + qh->c_usecs) / qh->period)
613                 : (qh->usecs * 8);
614
615         dev_dbg (&qh->dev->dev,
616                 "unlink qh%d-%04x/%p start %d [%d/%d us]\n",
617                 qh->period,
618                 hc32_to_cpup(ehci, &qh->hw->hw_info2) & (QH_CMASK | QH_SMASK),
619                 qh, qh->start, qh->usecs, qh->c_usecs);
620
621         /* qh->qh_next still "live" to HC */
622         qh->qh_state = QH_STATE_UNLINK;
623         qh->qh_next.ptr = NULL;
624         qh_put (qh);
625
626         /* maybe turn off periodic schedule */
627         return disable_periodic(ehci);
628 }
629
630 static void intr_deschedule (struct ehci_hcd *ehci, struct ehci_qh *qh)
631 {
632         unsigned                wait;
633         struct ehci_qh_hw       *hw = qh->hw;
634         int                     rc;
635
636         /* If the QH isn't linked then there's nothing we can do
637          * unless we were called during a giveback, in which case
638          * qh_completions() has to deal with it.
639          */
640         if (qh->qh_state != QH_STATE_LINKED) {
641                 if (qh->qh_state == QH_STATE_COMPLETING)
642                         qh->needs_rescan = 1;
643                 return;
644         }
645
646         qh_unlink_periodic (ehci, qh);
647
648         /* simple/paranoid:  always delay, expecting the HC needs to read
649          * qh->hw_next or finish a writeback after SPLIT/CSPLIT ... and
650          * expect khubd to clean up after any CSPLITs we won't issue.
651          * active high speed queues may need bigger delays...
652          */
653         if (list_empty (&qh->qtd_list)
654                         || (cpu_to_hc32(ehci, QH_CMASK)
655                                         & hw->hw_info2) != 0)
656                 wait = 2;
657         else
658                 wait = 55;      /* worst case: 3 * 1024 */
659
660         udelay (wait);
661         qh->qh_state = QH_STATE_IDLE;
662         hw->hw_next = EHCI_LIST_END(ehci);
663         wmb ();
664
665         qh_completions(ehci, qh);
666
667         /* reschedule QH iff another request is queued */
668         if (!list_empty(&qh->qtd_list) &&
669                         HC_IS_RUNNING(ehci_to_hcd(ehci)->state)) {
670                 rc = qh_schedule(ehci, qh);
671
672                 /* An error here likely indicates handshake failure
673                  * or no space left in the schedule.  Neither fault
674                  * should happen often ...
675                  *
676                  * FIXME kill the now-dysfunctional queued urbs
677                  */
678                 if (rc != 0)
679                         ehci_err(ehci, "can't reschedule qh %p, err %d\n",
680                                         qh, rc);
681         }
682 }
683
684 /*-------------------------------------------------------------------------*/
685
686 static int check_period (
687         struct ehci_hcd *ehci,
688         unsigned        frame,
689         unsigned        uframe,
690         unsigned        period,
691         unsigned        usecs
692 ) {
693         int             claimed;
694
695         /* complete split running into next frame?
696          * given FSTN support, we could sometimes check...
697          */
698         if (uframe >= 8)
699                 return 0;
700
701         /*
702          * 80% periodic == 100 usec/uframe available
703          * convert "usecs we need" to "max already claimed"
704          */
705         usecs = 100 - usecs;
706
707         /* we "know" 2 and 4 uframe intervals were rejected; so
708          * for period 0, check _every_ microframe in the schedule.
709          */
710         if (unlikely (period == 0)) {
711                 do {
712                         for (uframe = 0; uframe < 7; uframe++) {
713                                 claimed = periodic_usecs (ehci, frame, uframe);
714                                 if (claimed > usecs)
715                                         return 0;
716                         }
717                 } while ((frame += 1) < ehci->periodic_size);
718
719         /* just check the specified uframe, at that period */
720         } else {
721                 do {
722                         claimed = periodic_usecs (ehci, frame, uframe);
723                         if (claimed > usecs)
724                                 return 0;
725                 } while ((frame += period) < ehci->periodic_size);
726         }
727
728         // success!
729         return 1;
730 }
731
732 static int check_intr_schedule (
733         struct ehci_hcd         *ehci,
734         unsigned                frame,
735         unsigned                uframe,
736         const struct ehci_qh    *qh,
737         __hc32                  *c_maskp
738 )
739 {
740         int             retval = -ENOSPC;
741         u8              mask = 0;
742
743         if (qh->c_usecs && uframe >= 6)         /* FSTN territory? */
744                 goto done;
745
746         if (!check_period (ehci, frame, uframe, qh->period, qh->usecs))
747                 goto done;
748         if (!qh->c_usecs) {
749                 retval = 0;
750                 *c_maskp = 0;
751                 goto done;
752         }
753
754 #ifdef CONFIG_USB_EHCI_TT_NEWSCHED
755         if (tt_available (ehci, qh->period, qh->dev, frame, uframe,
756                                 qh->tt_usecs)) {
757                 unsigned i;
758
759                 /* TODO : this may need FSTN for SSPLIT in uframe 5. */
760                 for (i=uframe+1; i<8 && i<uframe+4; i++)
761                         if (!check_period (ehci, frame, i,
762                                                 qh->period, qh->c_usecs))
763                                 goto done;
764                         else
765                                 mask |= 1 << i;
766
767                 retval = 0;
768
769                 *c_maskp = cpu_to_hc32(ehci, mask << 8);
770         }
771 #else
772         /* Make sure this tt's buffer is also available for CSPLITs.
773          * We pessimize a bit; probably the typical full speed case
774          * doesn't need the second CSPLIT.
775          *
776          * NOTE:  both SPLIT and CSPLIT could be checked in just
777          * one smart pass...
778          */
779         mask = 0x03 << (uframe + qh->gap_uf);
780         *c_maskp = cpu_to_hc32(ehci, mask << 8);
781
782         mask |= 1 << uframe;
783         if (tt_no_collision (ehci, qh->period, qh->dev, frame, mask)) {
784                 if (!check_period (ehci, frame, uframe + qh->gap_uf + 1,
785                                         qh->period, qh->c_usecs))
786                         goto done;
787                 if (!check_period (ehci, frame, uframe + qh->gap_uf,
788                                         qh->period, qh->c_usecs))
789                         goto done;
790                 retval = 0;
791         }
792 #endif
793 done:
794         return retval;
795 }
796
797 /* "first fit" scheduling policy used the first time through,
798  * or when the previous schedule slot can't be re-used.
799  */
800 static int qh_schedule(struct ehci_hcd *ehci, struct ehci_qh *qh)
801 {
802         int             status;
803         unsigned        uframe;
804         __hc32          c_mask;
805         unsigned        frame;          /* 0..(qh->period - 1), or NO_FRAME */
806         struct ehci_qh_hw       *hw = qh->hw;
807
808         qh_refresh(ehci, qh);
809         hw->hw_next = EHCI_LIST_END(ehci);
810         frame = qh->start;
811
812         /* reuse the previous schedule slots, if we can */
813         if (frame < qh->period) {
814                 uframe = ffs(hc32_to_cpup(ehci, &hw->hw_info2) & QH_SMASK);
815                 status = check_intr_schedule (ehci, frame, --uframe,
816                                 qh, &c_mask);
817         } else {
818                 uframe = 0;
819                 c_mask = 0;
820                 status = -ENOSPC;
821         }
822
823         /* else scan the schedule to find a group of slots such that all
824          * uframes have enough periodic bandwidth available.
825          */
826         if (status) {
827                 /* "normal" case, uframing flexible except with splits */
828                 if (qh->period) {
829                         int             i;
830
831                         for (i = qh->period; status && i > 0; --i) {
832                                 frame = ++ehci->random_frame % qh->period;
833                                 for (uframe = 0; uframe < 8; uframe++) {
834                                         status = check_intr_schedule (ehci,
835                                                         frame, uframe, qh,
836                                                         &c_mask);
837                                         if (status == 0)
838                                                 break;
839                                 }
840                         }
841
842                 /* qh->period == 0 means every uframe */
843                 } else {
844                         frame = 0;
845                         status = check_intr_schedule (ehci, 0, 0, qh, &c_mask);
846                 }
847                 if (status)
848                         goto done;
849                 qh->start = frame;
850
851                 /* reset S-frame and (maybe) C-frame masks */
852                 hw->hw_info2 &= cpu_to_hc32(ehci, ~(QH_CMASK | QH_SMASK));
853                 hw->hw_info2 |= qh->period
854                         ? cpu_to_hc32(ehci, 1 << uframe)
855                         : cpu_to_hc32(ehci, QH_SMASK);
856                 hw->hw_info2 |= c_mask;
857         } else
858                 ehci_dbg (ehci, "reused qh %p schedule\n", qh);
859
860         /* stuff into the periodic schedule */
861         status = qh_link_periodic (ehci, qh);
862 done:
863         return status;
864 }
865
866 static int intr_submit (
867         struct ehci_hcd         *ehci,
868         struct urb              *urb,
869         struct list_head        *qtd_list,
870         gfp_t                   mem_flags
871 ) {
872         unsigned                epnum;
873         unsigned long           flags;
874         struct ehci_qh          *qh;
875         int                     status;
876         struct list_head        empty;
877
878         /* get endpoint and transfer/schedule data */
879         epnum = urb->ep->desc.bEndpointAddress;
880
881         spin_lock_irqsave (&ehci->lock, flags);
882
883         if (unlikely(!HCD_HW_ACCESSIBLE(ehci_to_hcd(ehci)))) {
884                 status = -ESHUTDOWN;
885                 goto done_not_linked;
886         }
887         status = usb_hcd_link_urb_to_ep(ehci_to_hcd(ehci), urb);
888         if (unlikely(status))
889                 goto done_not_linked;
890
891         /* get qh and force any scheduling errors */
892         INIT_LIST_HEAD (&empty);
893         qh = qh_append_tds(ehci, urb, &empty, epnum, &urb->ep->hcpriv);
894         if (qh == NULL) {
895                 status = -ENOMEM;
896                 goto done;
897         }
898         if (qh->qh_state == QH_STATE_IDLE) {
899                 if ((status = qh_schedule (ehci, qh)) != 0)
900                         goto done;
901         }
902
903         /* then queue the urb's tds to the qh */
904         qh = qh_append_tds(ehci, urb, qtd_list, epnum, &urb->ep->hcpriv);
905         BUG_ON (qh == NULL);
906
907         /* ... update usbfs periodic stats */
908         ehci_to_hcd(ehci)->self.bandwidth_int_reqs++;
909
910 done:
911         if (unlikely(status))
912                 usb_hcd_unlink_urb_from_ep(ehci_to_hcd(ehci), urb);
913 done_not_linked:
914         spin_unlock_irqrestore (&ehci->lock, flags);
915         if (status)
916                 qtd_list_free (ehci, urb, qtd_list);
917
918         return status;
919 }
920
921 /*-------------------------------------------------------------------------*/
922
923 /* ehci_iso_stream ops work with both ITD and SITD */
924
925 static struct ehci_iso_stream *
926 iso_stream_alloc (gfp_t mem_flags)
927 {
928         struct ehci_iso_stream *stream;
929
930         stream = kzalloc(sizeof *stream, mem_flags);
931         if (likely (stream != NULL)) {
932                 INIT_LIST_HEAD(&stream->td_list);
933                 INIT_LIST_HEAD(&stream->free_list);
934                 stream->next_uframe = -1;
935                 stream->refcount = 1;
936         }
937         return stream;
938 }
939
940 static void
941 iso_stream_init (
942         struct ehci_hcd         *ehci,
943         struct ehci_iso_stream  *stream,
944         struct usb_device       *dev,
945         int                     pipe,
946         unsigned                interval
947 )
948 {
949         static const u8 smask_out [] = { 0x01, 0x03, 0x07, 0x0f, 0x1f, 0x3f };
950
951         u32                     buf1;
952         unsigned                epnum, maxp;
953         int                     is_input;
954         long                    bandwidth;
955
956         /*
957          * this might be a "high bandwidth" highspeed endpoint,
958          * as encoded in the ep descriptor's wMaxPacket field
959          */
960         epnum = usb_pipeendpoint (pipe);
961         is_input = usb_pipein (pipe) ? USB_DIR_IN : 0;
962         maxp = usb_maxpacket(dev, pipe, !is_input);
963         if (is_input) {
964                 buf1 = (1 << 11);
965         } else {
966                 buf1 = 0;
967         }
968
969         /* knows about ITD vs SITD */
970         if (dev->speed == USB_SPEED_HIGH) {
971                 unsigned multi = hb_mult(maxp);
972
973                 stream->highspeed = 1;
974
975                 maxp = max_packet(maxp);
976                 buf1 |= maxp;
977                 maxp *= multi;
978
979                 stream->buf0 = cpu_to_hc32(ehci, (epnum << 8) | dev->devnum);
980                 stream->buf1 = cpu_to_hc32(ehci, buf1);
981                 stream->buf2 = cpu_to_hc32(ehci, multi);
982
983                 /* usbfs wants to report the average usecs per frame tied up
984                  * when transfers on this endpoint are scheduled ...
985                  */
986                 stream->usecs = HS_USECS_ISO (maxp);
987                 bandwidth = stream->usecs * 8;
988                 bandwidth /= interval;
989
990         } else {
991                 u32             addr;
992                 int             think_time;
993                 int             hs_transfers;
994
995                 addr = dev->ttport << 24;
996                 if (!ehci_is_TDI(ehci)
997                                 || (dev->tt->hub !=
998                                         ehci_to_hcd(ehci)->self.root_hub))
999                         addr |= dev->tt->hub->devnum << 16;
1000                 addr |= epnum << 8;
1001                 addr |= dev->devnum;
1002                 stream->usecs = HS_USECS_ISO (maxp);
1003                 think_time = dev->tt ? dev->tt->think_time : 0;
1004                 stream->tt_usecs = NS_TO_US (think_time + usb_calc_bus_time (
1005                                 dev->speed, is_input, 1, maxp));
1006                 hs_transfers = max (1u, (maxp + 187) / 188);
1007                 if (is_input) {
1008                         u32     tmp;
1009
1010                         addr |= 1 << 31;
1011                         stream->c_usecs = stream->usecs;
1012                         stream->usecs = HS_USECS_ISO (1);
1013                         stream->raw_mask = 1;
1014
1015                         /* c-mask as specified in USB 2.0 11.18.4 3.c */
1016                         tmp = (1 << (hs_transfers + 2)) - 1;
1017                         stream->raw_mask |= tmp << (8 + 2);
1018                 } else
1019                         stream->raw_mask = smask_out [hs_transfers - 1];
1020                 bandwidth = stream->usecs + stream->c_usecs;
1021                 bandwidth /= interval << 3;
1022
1023                 /* stream->splits gets created from raw_mask later */
1024                 stream->address = cpu_to_hc32(ehci, addr);
1025         }
1026         stream->bandwidth = bandwidth;
1027
1028         stream->udev = dev;
1029
1030         stream->bEndpointAddress = is_input | epnum;
1031         stream->interval = interval;
1032         stream->maxp = maxp;
1033 }
1034
1035 static void
1036 iso_stream_put(struct ehci_hcd *ehci, struct ehci_iso_stream *stream)
1037 {
1038         stream->refcount--;
1039
1040         /* free whenever just a dev->ep reference remains.
1041          * not like a QH -- no persistent state (toggle, halt)
1042          */
1043         if (stream->refcount == 1) {
1044                 int             is_in;
1045
1046                 // BUG_ON (!list_empty(&stream->td_list));
1047
1048                 while (!list_empty (&stream->free_list)) {
1049                         struct list_head        *entry;
1050
1051                         entry = stream->free_list.next;
1052                         list_del (entry);
1053
1054                         /* knows about ITD vs SITD */
1055                         if (stream->highspeed) {
1056                                 struct ehci_itd         *itd;
1057
1058                                 itd = list_entry (entry, struct ehci_itd,
1059                                                 itd_list);
1060                                 dma_pool_free (ehci->itd_pool, itd,
1061                                                 itd->itd_dma);
1062                         } else {
1063                                 struct ehci_sitd        *sitd;
1064
1065                                 sitd = list_entry (entry, struct ehci_sitd,
1066                                                 sitd_list);
1067                                 dma_pool_free (ehci->sitd_pool, sitd,
1068                                                 sitd->sitd_dma);
1069                         }
1070                 }
1071
1072                 is_in = (stream->bEndpointAddress & USB_DIR_IN) ? 0x10 : 0;
1073                 stream->bEndpointAddress &= 0x0f;
1074                 if (stream->ep)
1075                         stream->ep->hcpriv = NULL;
1076
1077                 kfree(stream);
1078         }
1079 }
1080
1081 static inline struct ehci_iso_stream *
1082 iso_stream_get (struct ehci_iso_stream *stream)
1083 {
1084         if (likely (stream != NULL))
1085                 stream->refcount++;
1086         return stream;
1087 }
1088
1089 static struct ehci_iso_stream *
1090 iso_stream_find (struct ehci_hcd *ehci, struct urb *urb)
1091 {
1092         unsigned                epnum;
1093         struct ehci_iso_stream  *stream;
1094         struct usb_host_endpoint *ep;
1095         unsigned long           flags;
1096
1097         epnum = usb_pipeendpoint (urb->pipe);
1098         if (usb_pipein(urb->pipe))
1099                 ep = urb->dev->ep_in[epnum];
1100         else
1101                 ep = urb->dev->ep_out[epnum];
1102
1103         spin_lock_irqsave (&ehci->lock, flags);
1104         stream = ep->hcpriv;
1105
1106         if (unlikely (stream == NULL)) {
1107                 stream = iso_stream_alloc(GFP_ATOMIC);
1108                 if (likely (stream != NULL)) {
1109                         /* dev->ep owns the initial refcount */
1110                         ep->hcpriv = stream;
1111                         stream->ep = ep;
1112                         iso_stream_init(ehci, stream, urb->dev, urb->pipe,
1113                                         urb->interval);
1114                 }
1115
1116         /* if dev->ep [epnum] is a QH, hw is set */
1117         } else if (unlikely (stream->hw != NULL)) {
1118                 ehci_dbg (ehci, "dev %s ep%d%s, not iso??\n",
1119                         urb->dev->devpath, epnum,
1120                         usb_pipein(urb->pipe) ? "in" : "out");
1121                 stream = NULL;
1122         }
1123
1124         /* caller guarantees an eventual matching iso_stream_put */
1125         stream = iso_stream_get (stream);
1126
1127         spin_unlock_irqrestore (&ehci->lock, flags);
1128         return stream;
1129 }
1130
1131 /*-------------------------------------------------------------------------*/
1132
1133 /* ehci_iso_sched ops can be ITD-only or SITD-only */
1134
1135 static struct ehci_iso_sched *
1136 iso_sched_alloc (unsigned packets, gfp_t mem_flags)
1137 {
1138         struct ehci_iso_sched   *iso_sched;
1139         int                     size = sizeof *iso_sched;
1140
1141         size += packets * sizeof (struct ehci_iso_packet);
1142         iso_sched = kzalloc(size, mem_flags);
1143         if (likely (iso_sched != NULL)) {
1144                 INIT_LIST_HEAD (&iso_sched->td_list);
1145         }
1146         return iso_sched;
1147 }
1148
1149 static inline void
1150 itd_sched_init(
1151         struct ehci_hcd         *ehci,
1152         struct ehci_iso_sched   *iso_sched,
1153         struct ehci_iso_stream  *stream,
1154         struct urb              *urb
1155 )
1156 {
1157         unsigned        i;
1158         dma_addr_t      dma = urb->transfer_dma;
1159
1160         /* how many uframes are needed for these transfers */
1161         iso_sched->span = urb->number_of_packets * stream->interval;
1162
1163         /* figure out per-uframe itd fields that we'll need later
1164          * when we fit new itds into the schedule.
1165          */
1166         for (i = 0; i < urb->number_of_packets; i++) {
1167                 struct ehci_iso_packet  *uframe = &iso_sched->packet [i];
1168                 unsigned                length;
1169                 dma_addr_t              buf;
1170                 u32                     trans;
1171
1172                 length = urb->iso_frame_desc [i].length;
1173                 buf = dma + urb->iso_frame_desc [i].offset;
1174
1175                 trans = EHCI_ISOC_ACTIVE;
1176                 trans |= buf & 0x0fff;
1177                 if (unlikely (((i + 1) == urb->number_of_packets))
1178                                 && !(urb->transfer_flags & URB_NO_INTERRUPT))
1179                         trans |= EHCI_ITD_IOC;
1180                 trans |= length << 16;
1181                 uframe->transaction = cpu_to_hc32(ehci, trans);
1182
1183                 /* might need to cross a buffer page within a uframe */
1184                 uframe->bufp = (buf & ~(u64)0x0fff);
1185                 buf += length;
1186                 if (unlikely ((uframe->bufp != (buf & ~(u64)0x0fff))))
1187                         uframe->cross = 1;
1188         }
1189 }
1190
1191 static void
1192 iso_sched_free (
1193         struct ehci_iso_stream  *stream,
1194         struct ehci_iso_sched   *iso_sched
1195 )
1196 {
1197         if (!iso_sched)
1198                 return;
1199         // caller must hold ehci->lock!
1200         list_splice (&iso_sched->td_list, &stream->free_list);
1201         kfree (iso_sched);
1202 }
1203
1204 static int
1205 itd_urb_transaction (
1206         struct ehci_iso_stream  *stream,
1207         struct ehci_hcd         *ehci,
1208         struct urb              *urb,
1209         gfp_t                   mem_flags
1210 )
1211 {
1212         struct ehci_itd         *itd;
1213         dma_addr_t              itd_dma;
1214         int                     i;
1215         unsigned                num_itds;
1216         struct ehci_iso_sched   *sched;
1217         unsigned long           flags;
1218
1219         sched = iso_sched_alloc (urb->number_of_packets, mem_flags);
1220         if (unlikely (sched == NULL))
1221                 return -ENOMEM;
1222
1223         itd_sched_init(ehci, sched, stream, urb);
1224
1225         if (urb->interval < 8)
1226                 num_itds = 1 + (sched->span + 7) / 8;
1227         else
1228                 num_itds = urb->number_of_packets;
1229
1230         /* allocate/init ITDs */
1231         spin_lock_irqsave (&ehci->lock, flags);
1232         for (i = 0; i < num_itds; i++) {
1233
1234                 /* free_list.next might be cache-hot ... but maybe
1235                  * the HC caches it too. avoid that issue for now.
1236                  */
1237
1238                 /* prefer previously-allocated itds */
1239                 if (likely (!list_empty(&stream->free_list))) {
1240                         itd = list_entry (stream->free_list.prev,
1241                                         struct ehci_itd, itd_list);
1242                         list_del (&itd->itd_list);
1243                         itd_dma = itd->itd_dma;
1244                 } else {
1245                         spin_unlock_irqrestore (&ehci->lock, flags);
1246                         itd = dma_pool_alloc (ehci->itd_pool, mem_flags,
1247                                         &itd_dma);
1248                         spin_lock_irqsave (&ehci->lock, flags);
1249                         if (!itd) {
1250                                 iso_sched_free(stream, sched);
1251                                 spin_unlock_irqrestore(&ehci->lock, flags);
1252                                 return -ENOMEM;
1253                         }
1254                 }
1255
1256                 memset (itd, 0, sizeof *itd);
1257                 itd->itd_dma = itd_dma;
1258                 list_add (&itd->itd_list, &sched->td_list);
1259         }
1260         spin_unlock_irqrestore (&ehci->lock, flags);
1261
1262         /* temporarily store schedule info in hcpriv */
1263         urb->hcpriv = sched;
1264         urb->error_count = 0;
1265         return 0;
1266 }
1267
1268 /*-------------------------------------------------------------------------*/
1269
1270 static inline int
1271 itd_slot_ok (
1272         struct ehci_hcd         *ehci,
1273         u32                     mod,
1274         u32                     uframe,
1275         u8                      usecs,
1276         u32                     period
1277 )
1278 {
1279         uframe %= period;
1280         do {
1281                 /* can't commit more than 80% periodic == 100 usec */
1282                 if (periodic_usecs (ehci, uframe >> 3, uframe & 0x7)
1283                                 > (100 - usecs))
1284                         return 0;
1285
1286                 /* we know urb->interval is 2^N uframes */
1287                 uframe += period;
1288         } while (uframe < mod);
1289         return 1;
1290 }
1291
1292 static inline int
1293 sitd_slot_ok (
1294         struct ehci_hcd         *ehci,
1295         u32                     mod,
1296         struct ehci_iso_stream  *stream,
1297         u32                     uframe,
1298         struct ehci_iso_sched   *sched,
1299         u32                     period_uframes
1300 )
1301 {
1302         u32                     mask, tmp;
1303         u32                     frame, uf;
1304
1305         mask = stream->raw_mask << (uframe & 7);
1306
1307         /* for IN, don't wrap CSPLIT into the next frame */
1308         if (mask & ~0xffff)
1309                 return 0;
1310
1311         /* this multi-pass logic is simple, but performance may
1312          * suffer when the schedule data isn't cached.
1313          */
1314
1315         /* check bandwidth */
1316         uframe %= period_uframes;
1317         do {
1318                 u32             max_used;
1319
1320                 frame = uframe >> 3;
1321                 uf = uframe & 7;
1322
1323 #ifdef CONFIG_USB_EHCI_TT_NEWSCHED
1324                 /* The tt's fullspeed bus bandwidth must be available.
1325                  * tt_available scheduling guarantees 10+% for control/bulk.
1326                  */
1327                 if (!tt_available (ehci, period_uframes << 3,
1328                                 stream->udev, frame, uf, stream->tt_usecs))
1329                         return 0;
1330 #else
1331                 /* tt must be idle for start(s), any gap, and csplit.
1332                  * assume scheduling slop leaves 10+% for control/bulk.
1333                  */
1334                 if (!tt_no_collision (ehci, period_uframes << 3,
1335                                 stream->udev, frame, mask))
1336                         return 0;
1337 #endif
1338
1339                 /* check starts (OUT uses more than one) */
1340                 max_used = 100 - stream->usecs;
1341                 for (tmp = stream->raw_mask & 0xff; tmp; tmp >>= 1, uf++) {
1342                         if (periodic_usecs (ehci, frame, uf) > max_used)
1343                                 return 0;
1344                 }
1345
1346                 /* for IN, check CSPLIT */
1347                 if (stream->c_usecs) {
1348                         uf = uframe & 7;
1349                         max_used = 100 - stream->c_usecs;
1350                         do {
1351                                 tmp = 1 << uf;
1352                                 tmp <<= 8;
1353                                 if ((stream->raw_mask & tmp) == 0)
1354                                         continue;
1355                                 if (periodic_usecs (ehci, frame, uf)
1356                                                 > max_used)
1357                                         return 0;
1358                         } while (++uf < 8);
1359                 }
1360
1361                 /* we know urb->interval is 2^N uframes */
1362                 uframe += period_uframes;
1363         } while (uframe < mod);
1364
1365         stream->splits = cpu_to_hc32(ehci, stream->raw_mask << (uframe & 7));
1366         return 1;
1367 }
1368
1369 /*
1370  * This scheduler plans almost as far into the future as it has actual
1371  * periodic schedule slots.  (Affected by TUNE_FLS, which defaults to
1372  * "as small as possible" to be cache-friendlier.)  That limits the size
1373  * transfers you can stream reliably; avoid more than 64 msec per urb.
1374  * Also avoid queue depths of less than ehci's worst irq latency (affected
1375  * by the per-urb URB_NO_INTERRUPT hint, the log2_irq_thresh module parameter,
1376  * and other factors); or more than about 230 msec total (for portability,
1377  * given EHCI_TUNE_FLS and the slop).  Or, write a smarter scheduler!
1378  */
1379
1380 #define SCHEDULE_SLOP   80      /* microframes */
1381
1382 static int
1383 iso_stream_schedule (
1384         struct ehci_hcd         *ehci,
1385         struct urb              *urb,
1386         struct ehci_iso_stream  *stream
1387 )
1388 {
1389         u32                     now, next, start, period, span;
1390         int                     status;
1391         unsigned                mod = ehci->periodic_size << 3;
1392         struct ehci_iso_sched   *sched = urb->hcpriv;
1393
1394         period = urb->interval;
1395         span = sched->span;
1396         if (!stream->highspeed) {
1397                 period <<= 3;
1398                 span <<= 3;
1399         }
1400
1401         if (span > mod - SCHEDULE_SLOP) {
1402                 ehci_dbg (ehci, "iso request %p too long\n", urb);
1403                 status = -EFBIG;
1404                 goto fail;
1405         }
1406
1407         now = ehci_readl(ehci, &ehci->regs->frame_index) & (mod - 1);
1408
1409         /* Typical case: reuse current schedule, stream is still active.
1410          * Hopefully there are no gaps from the host falling behind
1411          * (irq delays etc), but if there are we'll take the next
1412          * slot in the schedule, implicitly assuming URB_ISO_ASAP.
1413          */
1414         if (likely (!list_empty (&stream->td_list))) {
1415                 u32     excess;
1416
1417                 /* For high speed devices, allow scheduling within the
1418                  * isochronous scheduling threshold.  For full speed devices
1419                  * and Intel PCI-based controllers, don't (work around for
1420                  * Intel ICH9 bug).
1421                  */
1422                 if (!stream->highspeed && ehci->fs_i_thresh)
1423                         next = now + ehci->i_thresh;
1424                 else
1425                         next = now;
1426
1427                 /* Fell behind (by up to twice the slop amount)?
1428                  * We decide based on the time of the last currently-scheduled
1429                  * slot, not the time of the next available slot.
1430                  */
1431                 excess = (stream->next_uframe - period - next) & (mod - 1);
1432                 if (excess >= mod - 2 * SCHEDULE_SLOP)
1433                         start = next + excess - mod + period *
1434                                         DIV_ROUND_UP(mod - excess, period);
1435                 else
1436                         start = next + excess + period;
1437                 if (start - now >= mod) {
1438                         ehci_dbg(ehci, "request %p would overflow (%d+%d >= %d)\n",
1439                                         urb, start - now - period, period,
1440                                         mod);
1441                         status = -EFBIG;
1442                         goto fail;
1443                 }
1444         }
1445
1446         /* need to schedule; when's the next (u)frame we could start?
1447          * this is bigger than ehci->i_thresh allows; scheduling itself
1448          * isn't free, the slop should handle reasonably slow cpus.  it
1449          * can also help high bandwidth if the dma and irq loads don't
1450          * jump until after the queue is primed.
1451          */
1452         else {
1453                 start = SCHEDULE_SLOP + (now & ~0x07);
1454
1455                 /* NOTE:  assumes URB_ISO_ASAP, to limit complexity/bugs */
1456
1457                 /* find a uframe slot with enough bandwidth */
1458                 next = start + period;
1459                 for (; start < next; start++) {
1460
1461                         /* check schedule: enough space? */
1462                         if (stream->highspeed) {
1463                                 if (itd_slot_ok(ehci, mod, start,
1464                                                 stream->usecs, period))
1465                                         break;
1466                         } else {
1467                                 if ((start % 8) >= 6)
1468                                         continue;
1469                                 if (sitd_slot_ok(ehci, mod, stream,
1470                                                 start, sched, period))
1471                                         break;
1472                         }
1473                 }
1474
1475                 /* no room in the schedule */
1476                 if (start == next) {
1477                         ehci_dbg(ehci, "iso resched full %p (now %d max %d)\n",
1478                                 urb, now, now + mod);
1479                         status = -ENOSPC;
1480                         goto fail;
1481                 }
1482         }
1483
1484         /* Tried to schedule too far into the future? */
1485         if (unlikely(start - now + span - period
1486                                 >= mod - 2 * SCHEDULE_SLOP)) {
1487                 ehci_dbg(ehci, "request %p would overflow (%d+%d >= %d)\n",
1488                                 urb, start - now, span - period,
1489                                 mod - 2 * SCHEDULE_SLOP);
1490                 status = -EFBIG;
1491                 goto fail;
1492         }
1493
1494         stream->next_uframe = start & (mod - 1);
1495
1496         /* report high speed start in uframes; full speed, in frames */
1497         urb->start_frame = stream->next_uframe;
1498         if (!stream->highspeed)
1499                 urb->start_frame >>= 3;
1500         return 0;
1501
1502  fail:
1503         iso_sched_free(stream, sched);
1504         urb->hcpriv = NULL;
1505         return status;
1506 }
1507
1508 /*-------------------------------------------------------------------------*/
1509
1510 static inline void
1511 itd_init(struct ehci_hcd *ehci, struct ehci_iso_stream *stream,
1512                 struct ehci_itd *itd)
1513 {
1514         int i;
1515
1516         /* it's been recently zeroed */
1517         itd->hw_next = EHCI_LIST_END(ehci);
1518         itd->hw_bufp [0] = stream->buf0;
1519         itd->hw_bufp [1] = stream->buf1;
1520         itd->hw_bufp [2] = stream->buf2;
1521
1522         for (i = 0; i < 8; i++)
1523                 itd->index[i] = -1;
1524
1525         /* All other fields are filled when scheduling */
1526 }
1527
1528 static inline void
1529 itd_patch(
1530         struct ehci_hcd         *ehci,
1531         struct ehci_itd         *itd,
1532         struct ehci_iso_sched   *iso_sched,
1533         unsigned                index,
1534         u16                     uframe
1535 )
1536 {
1537         struct ehci_iso_packet  *uf = &iso_sched->packet [index];
1538         unsigned                pg = itd->pg;
1539
1540         // BUG_ON (pg == 6 && uf->cross);
1541
1542         uframe &= 0x07;
1543         itd->index [uframe] = index;
1544
1545         itd->hw_transaction[uframe] = uf->transaction;
1546         itd->hw_transaction[uframe] |= cpu_to_hc32(ehci, pg << 12);
1547         itd->hw_bufp[pg] |= cpu_to_hc32(ehci, uf->bufp & ~(u32)0);
1548         itd->hw_bufp_hi[pg] |= cpu_to_hc32(ehci, (u32)(uf->bufp >> 32));
1549
1550         /* iso_frame_desc[].offset must be strictly increasing */
1551         if (unlikely (uf->cross)) {
1552                 u64     bufp = uf->bufp + 4096;
1553
1554                 itd->pg = ++pg;
1555                 itd->hw_bufp[pg] |= cpu_to_hc32(ehci, bufp & ~(u32)0);
1556                 itd->hw_bufp_hi[pg] |= cpu_to_hc32(ehci, (u32)(bufp >> 32));
1557         }
1558 }
1559
1560 static inline void
1561 itd_link (struct ehci_hcd *ehci, unsigned frame, struct ehci_itd *itd)
1562 {
1563         union ehci_shadow       *prev = &ehci->pshadow[frame];
1564         __hc32                  *hw_p = &ehci->periodic[frame];
1565         union ehci_shadow       here = *prev;
1566         __hc32                  type = 0;
1567
1568         /* skip any iso nodes which might belong to previous microframes */
1569         while (here.ptr) {
1570                 type = Q_NEXT_TYPE(ehci, *hw_p);
1571                 if (type == cpu_to_hc32(ehci, Q_TYPE_QH))
1572                         break;
1573                 prev = periodic_next_shadow(ehci, prev, type);
1574                 hw_p = shadow_next_periodic(ehci, &here, type);
1575                 here = *prev;
1576         }
1577
1578         itd->itd_next = here;
1579         itd->hw_next = *hw_p;
1580         prev->itd = itd;
1581         itd->frame = frame;
1582         wmb ();
1583         *hw_p = cpu_to_hc32(ehci, itd->itd_dma | Q_TYPE_ITD);
1584 }
1585
1586 /* fit urb's itds into the selected schedule slot; activate as needed */
1587 static int
1588 itd_link_urb (
1589         struct ehci_hcd         *ehci,
1590         struct urb              *urb,
1591         unsigned                mod,
1592         struct ehci_iso_stream  *stream
1593 )
1594 {
1595         int                     packet;
1596         unsigned                next_uframe, uframe, frame;
1597         struct ehci_iso_sched   *iso_sched = urb->hcpriv;
1598         struct ehci_itd         *itd;
1599
1600         next_uframe = stream->next_uframe & (mod - 1);
1601
1602         if (unlikely (list_empty(&stream->td_list))) {
1603                 ehci_to_hcd(ehci)->self.bandwidth_allocated
1604                                 += stream->bandwidth;
1605                 ehci_vdbg (ehci,
1606                         "schedule devp %s ep%d%s-iso period %d start %d.%d\n",
1607                         urb->dev->devpath, stream->bEndpointAddress & 0x0f,
1608                         (stream->bEndpointAddress & USB_DIR_IN) ? "in" : "out",
1609                         urb->interval,
1610                         next_uframe >> 3, next_uframe & 0x7);
1611         }
1612         ehci_to_hcd(ehci)->self.bandwidth_isoc_reqs++;
1613
1614         /* fill iTDs uframe by uframe */
1615         for (packet = 0, itd = NULL; packet < urb->number_of_packets; ) {
1616                 if (itd == NULL) {
1617                         /* ASSERT:  we have all necessary itds */
1618                         // BUG_ON (list_empty (&iso_sched->td_list));
1619
1620                         /* ASSERT:  no itds for this endpoint in this uframe */
1621
1622                         itd = list_entry (iso_sched->td_list.next,
1623                                         struct ehci_itd, itd_list);
1624                         list_move_tail (&itd->itd_list, &stream->td_list);
1625                         itd->stream = iso_stream_get (stream);
1626                         itd->urb = urb;
1627                         itd_init (ehci, stream, itd);
1628                 }
1629
1630                 uframe = next_uframe & 0x07;
1631                 frame = next_uframe >> 3;
1632
1633                 itd_patch(ehci, itd, iso_sched, packet, uframe);
1634
1635                 next_uframe += stream->interval;
1636                 next_uframe &= mod - 1;
1637                 packet++;
1638
1639                 /* link completed itds into the schedule */
1640                 if (((next_uframe >> 3) != frame)
1641                                 || packet == urb->number_of_packets) {
1642                         itd_link(ehci, frame & (ehci->periodic_size - 1), itd);
1643                         itd = NULL;
1644                 }
1645         }
1646         stream->next_uframe = next_uframe;
1647
1648         /* don't need that schedule data any more */
1649         iso_sched_free (stream, iso_sched);
1650         urb->hcpriv = NULL;
1651
1652         timer_action (ehci, TIMER_IO_WATCHDOG);
1653         return enable_periodic(ehci);
1654 }
1655
1656 #define ISO_ERRS (EHCI_ISOC_BUF_ERR | EHCI_ISOC_BABBLE | EHCI_ISOC_XACTERR)
1657
1658 /* Process and recycle a completed ITD.  Return true iff its urb completed,
1659  * and hence its completion callback probably added things to the hardware
1660  * schedule.
1661  *
1662  * Note that we carefully avoid recycling this descriptor until after any
1663  * completion callback runs, so that it won't be reused quickly.  That is,
1664  * assuming (a) no more than two urbs per frame on this endpoint, and also
1665  * (b) only this endpoint's completions submit URBs.  It seems some silicon
1666  * corrupts things if you reuse completed descriptors very quickly...
1667  */
1668 static unsigned
1669 itd_complete (
1670         struct ehci_hcd *ehci,
1671         struct ehci_itd *itd
1672 ) {
1673         struct urb                              *urb = itd->urb;
1674         struct usb_iso_packet_descriptor        *desc;
1675         u32                                     t;
1676         unsigned                                uframe;
1677         int                                     urb_index = -1;
1678         struct ehci_iso_stream                  *stream = itd->stream;
1679         struct usb_device                       *dev;
1680         unsigned                                retval = false;
1681
1682         /* for each uframe with a packet */
1683         for (uframe = 0; uframe < 8; uframe++) {
1684                 if (likely (itd->index[uframe] == -1))
1685                         continue;
1686                 urb_index = itd->index[uframe];
1687                 desc = &urb->iso_frame_desc [urb_index];
1688
1689                 t = hc32_to_cpup(ehci, &itd->hw_transaction [uframe]);
1690                 itd->hw_transaction [uframe] = 0;
1691
1692                 /* report transfer status */
1693                 if (unlikely (t & ISO_ERRS)) {
1694                         urb->error_count++;
1695                         if (t & EHCI_ISOC_BUF_ERR)
1696                                 desc->status = usb_pipein (urb->pipe)
1697                                         ? -ENOSR  /* hc couldn't read */
1698                                         : -ECOMM; /* hc couldn't write */
1699                         else if (t & EHCI_ISOC_BABBLE)
1700                                 desc->status = -EOVERFLOW;
1701                         else /* (t & EHCI_ISOC_XACTERR) */
1702                                 desc->status = -EPROTO;
1703
1704                         /* HC need not update length with this error */
1705                         if (!(t & EHCI_ISOC_BABBLE)) {
1706                                 desc->actual_length = EHCI_ITD_LENGTH(t);
1707                                 urb->actual_length += desc->actual_length;
1708                         }
1709                 } else if (likely ((t & EHCI_ISOC_ACTIVE) == 0)) {
1710                         desc->status = 0;
1711                         desc->actual_length = EHCI_ITD_LENGTH(t);
1712                         urb->actual_length += desc->actual_length;
1713                 } else {
1714                         /* URB was too late */
1715                         desc->status = -EXDEV;
1716                 }
1717         }
1718
1719         /* handle completion now? */
1720         if (likely ((urb_index + 1) != urb->number_of_packets))
1721                 goto done;
1722
1723         /* ASSERT: it's really the last itd for this urb
1724         list_for_each_entry (itd, &stream->td_list, itd_list)
1725                 BUG_ON (itd->urb == urb);
1726          */
1727
1728         /* give urb back to the driver; completion often (re)submits */
1729         dev = urb->dev;
1730         ehci_urb_done(ehci, urb, 0);
1731         retval = true;
1732         urb = NULL;
1733         (void) disable_periodic(ehci);
1734         ehci_to_hcd(ehci)->self.bandwidth_isoc_reqs--;
1735
1736         if (unlikely(list_is_singular(&stream->td_list))) {
1737                 ehci_to_hcd(ehci)->self.bandwidth_allocated
1738                                 -= stream->bandwidth;
1739                 ehci_vdbg (ehci,
1740                         "deschedule devp %s ep%d%s-iso\n",
1741                         dev->devpath, stream->bEndpointAddress & 0x0f,
1742                         (stream->bEndpointAddress & USB_DIR_IN) ? "in" : "out");
1743         }
1744         iso_stream_put (ehci, stream);
1745
1746 done:
1747         itd->urb = NULL;
1748         if (ehci->clock_frame != itd->frame || itd->index[7] != -1) {
1749                 /* OK to recycle this ITD now. */
1750                 itd->stream = NULL;
1751                 list_move(&itd->itd_list, &stream->free_list);
1752                 iso_stream_put(ehci, stream);
1753         } else {
1754                 /* HW might remember this ITD, so we can't recycle it yet.
1755                  * Move it to a safe place until a new frame starts.
1756                  */
1757                 list_move(&itd->itd_list, &ehci->cached_itd_list);
1758                 if (stream->refcount == 2) {
1759                         /* If iso_stream_put() were called here, stream
1760                          * would be freed.  Instead, just prevent reuse.
1761                          */
1762                         stream->ep->hcpriv = NULL;
1763                         stream->ep = NULL;
1764                 }
1765         }
1766         return retval;
1767 }
1768
1769 /*-------------------------------------------------------------------------*/
1770
1771 static int itd_submit (struct ehci_hcd *ehci, struct urb *urb,
1772         gfp_t mem_flags)
1773 {
1774         int                     status = -EINVAL;
1775         unsigned long           flags;
1776         struct ehci_iso_stream  *stream;
1777
1778         /* Get iso_stream head */
1779         stream = iso_stream_find (ehci, urb);
1780         if (unlikely (stream == NULL)) {
1781                 ehci_dbg (ehci, "can't get iso stream\n");
1782                 return -ENOMEM;
1783         }
1784         if (unlikely (urb->interval != stream->interval)) {
1785                 ehci_dbg (ehci, "can't change iso interval %d --> %d\n",
1786                         stream->interval, urb->interval);
1787                 goto done;
1788         }
1789
1790 #ifdef EHCI_URB_TRACE
1791         ehci_dbg (ehci,
1792                 "%s %s urb %p ep%d%s len %d, %d pkts %d uframes [%p]\n",
1793                 __func__, urb->dev->devpath, urb,
1794                 usb_pipeendpoint (urb->pipe),
1795                 usb_pipein (urb->pipe) ? "in" : "out",
1796                 urb->transfer_buffer_length,
1797                 urb->number_of_packets, urb->interval,
1798                 stream);
1799 #endif
1800
1801         /* allocate ITDs w/o locking anything */
1802         status = itd_urb_transaction (stream, ehci, urb, mem_flags);
1803         if (unlikely (status < 0)) {
1804                 ehci_dbg (ehci, "can't init itds\n");
1805                 goto done;
1806         }
1807
1808         /* schedule ... need to lock */
1809         spin_lock_irqsave (&ehci->lock, flags);
1810         if (unlikely(!HCD_HW_ACCESSIBLE(ehci_to_hcd(ehci)))) {
1811                 status = -ESHUTDOWN;
1812                 goto done_not_linked;
1813         }
1814         status = usb_hcd_link_urb_to_ep(ehci_to_hcd(ehci), urb);
1815         if (unlikely(status))
1816                 goto done_not_linked;
1817         status = iso_stream_schedule(ehci, urb, stream);
1818         if (likely (status == 0))
1819                 itd_link_urb (ehci, urb, ehci->periodic_size << 3, stream);
1820         else
1821                 usb_hcd_unlink_urb_from_ep(ehci_to_hcd(ehci), urb);
1822 done_not_linked:
1823         spin_unlock_irqrestore (&ehci->lock, flags);
1824
1825 done:
1826         if (unlikely (status < 0))
1827                 iso_stream_put (ehci, stream);
1828         return status;
1829 }
1830
1831 /*-------------------------------------------------------------------------*/
1832
1833 /*
1834  * "Split ISO TDs" ... used for USB 1.1 devices going through the
1835  * TTs in USB 2.0 hubs.  These need microframe scheduling.
1836  */
1837
1838 static inline void
1839 sitd_sched_init(
1840         struct ehci_hcd         *ehci,
1841         struct ehci_iso_sched   *iso_sched,
1842         struct ehci_iso_stream  *stream,
1843         struct urb              *urb
1844 )
1845 {
1846         unsigned        i;
1847         dma_addr_t      dma = urb->transfer_dma;
1848
1849         /* how many frames are needed for these transfers */
1850         iso_sched->span = urb->number_of_packets * stream->interval;
1851
1852         /* figure out per-frame sitd fields that we'll need later
1853          * when we fit new sitds into the schedule.
1854          */
1855         for (i = 0; i < urb->number_of_packets; i++) {
1856                 struct ehci_iso_packet  *packet = &iso_sched->packet [i];
1857                 unsigned                length;
1858                 dma_addr_t              buf;
1859                 u32                     trans;
1860
1861                 length = urb->iso_frame_desc [i].length & 0x03ff;
1862                 buf = dma + urb->iso_frame_desc [i].offset;
1863
1864                 trans = SITD_STS_ACTIVE;
1865                 if (((i + 1) == urb->number_of_packets)
1866                                 && !(urb->transfer_flags & URB_NO_INTERRUPT))
1867                         trans |= SITD_IOC;
1868                 trans |= length << 16;
1869                 packet->transaction = cpu_to_hc32(ehci, trans);
1870
1871                 /* might need to cross a buffer page within a td */
1872                 packet->bufp = buf;
1873                 packet->buf1 = (buf + length) & ~0x0fff;
1874                 if (packet->buf1 != (buf & ~(u64)0x0fff))
1875                         packet->cross = 1;
1876
1877                 /* OUT uses multiple start-splits */
1878                 if (stream->bEndpointAddress & USB_DIR_IN)
1879                         continue;
1880                 length = (length + 187) / 188;
1881                 if (length > 1) /* BEGIN vs ALL */
1882                         length |= 1 << 3;
1883                 packet->buf1 |= length;
1884         }
1885 }
1886
1887 static int
1888 sitd_urb_transaction (
1889         struct ehci_iso_stream  *stream,
1890         struct ehci_hcd         *ehci,
1891         struct urb              *urb,
1892         gfp_t                   mem_flags
1893 )
1894 {
1895         struct ehci_sitd        *sitd;
1896         dma_addr_t              sitd_dma;
1897         int                     i;
1898         struct ehci_iso_sched   *iso_sched;
1899         unsigned long           flags;
1900
1901         iso_sched = iso_sched_alloc (urb->number_of_packets, mem_flags);
1902         if (iso_sched == NULL)
1903                 return -ENOMEM;
1904
1905         sitd_sched_init(ehci, iso_sched, stream, urb);
1906
1907         /* allocate/init sITDs */
1908         spin_lock_irqsave (&ehci->lock, flags);
1909         for (i = 0; i < urb->number_of_packets; i++) {
1910
1911                 /* NOTE:  for now, we don't try to handle wraparound cases
1912                  * for IN (using sitd->hw_backpointer, like a FSTN), which
1913                  * means we never need two sitds for full speed packets.
1914                  */
1915
1916                 /* free_list.next might be cache-hot ... but maybe
1917                  * the HC caches it too. avoid that issue for now.
1918                  */
1919
1920                 /* prefer previously-allocated sitds */
1921                 if (!list_empty(&stream->free_list)) {
1922                         sitd = list_entry (stream->free_list.prev,
1923                                          struct ehci_sitd, sitd_list);
1924                         list_del (&sitd->sitd_list);
1925                         sitd_dma = sitd->sitd_dma;
1926                 } else {
1927                         spin_unlock_irqrestore (&ehci->lock, flags);
1928                         sitd = dma_pool_alloc (ehci->sitd_pool, mem_flags,
1929                                         &sitd_dma);
1930                         spin_lock_irqsave (&ehci->lock, flags);
1931                         if (!sitd) {
1932                                 iso_sched_free(stream, iso_sched);
1933                                 spin_unlock_irqrestore(&ehci->lock, flags);
1934                                 return -ENOMEM;
1935                         }
1936                 }
1937
1938                 memset (sitd, 0, sizeof *sitd);
1939                 sitd->sitd_dma = sitd_dma;
1940                 list_add (&sitd->sitd_list, &iso_sched->td_list);
1941         }
1942
1943         /* temporarily store schedule info in hcpriv */
1944         urb->hcpriv = iso_sched;
1945         urb->error_count = 0;
1946
1947         spin_unlock_irqrestore (&ehci->lock, flags);
1948         return 0;
1949 }
1950
1951 /*-------------------------------------------------------------------------*/
1952
1953 static inline void
1954 sitd_patch(
1955         struct ehci_hcd         *ehci,
1956         struct ehci_iso_stream  *stream,
1957         struct ehci_sitd        *sitd,
1958         struct ehci_iso_sched   *iso_sched,
1959         unsigned                index
1960 )
1961 {
1962         struct ehci_iso_packet  *uf = &iso_sched->packet [index];
1963         u64                     bufp = uf->bufp;
1964
1965         sitd->hw_next = EHCI_LIST_END(ehci);
1966         sitd->hw_fullspeed_ep = stream->address;
1967         sitd->hw_uframe = stream->splits;
1968         sitd->hw_results = uf->transaction;
1969         sitd->hw_backpointer = EHCI_LIST_END(ehci);
1970
1971         bufp = uf->bufp;
1972         sitd->hw_buf[0] = cpu_to_hc32(ehci, bufp);
1973         sitd->hw_buf_hi[0] = cpu_to_hc32(ehci, bufp >> 32);
1974
1975         sitd->hw_buf[1] = cpu_to_hc32(ehci, uf->buf1);
1976         if (uf->cross)
1977                 bufp += 4096;
1978         sitd->hw_buf_hi[1] = cpu_to_hc32(ehci, bufp >> 32);
1979         sitd->index = index;
1980 }
1981
1982 static inline void
1983 sitd_link (struct ehci_hcd *ehci, unsigned frame, struct ehci_sitd *sitd)
1984 {
1985         /* note: sitd ordering could matter (CSPLIT then SSPLIT) */
1986         sitd->sitd_next = ehci->pshadow [frame];
1987         sitd->hw_next = ehci->periodic [frame];
1988         ehci->pshadow [frame].sitd = sitd;
1989         sitd->frame = frame;
1990         wmb ();
1991         ehci->periodic[frame] = cpu_to_hc32(ehci, sitd->sitd_dma | Q_TYPE_SITD);
1992 }
1993
1994 /* fit urb's sitds into the selected schedule slot; activate as needed */
1995 static int
1996 sitd_link_urb (
1997         struct ehci_hcd         *ehci,
1998         struct urb              *urb,
1999         unsigned                mod,
2000         struct ehci_iso_stream  *stream
2001 )
2002 {
2003         int                     packet;
2004         unsigned                next_uframe;
2005         struct ehci_iso_sched   *sched = urb->hcpriv;
2006         struct ehci_sitd        *sitd;
2007
2008         next_uframe = stream->next_uframe;
2009
2010         if (list_empty(&stream->td_list)) {
2011                 /* usbfs ignores TT bandwidth */
2012                 ehci_to_hcd(ehci)->self.bandwidth_allocated
2013                                 += stream->bandwidth;
2014                 ehci_vdbg (ehci,
2015                         "sched devp %s ep%d%s-iso [%d] %dms/%04x\n",
2016                         urb->dev->devpath, stream->bEndpointAddress & 0x0f,
2017                         (stream->bEndpointAddress & USB_DIR_IN) ? "in" : "out",
2018                         (next_uframe >> 3) & (ehci->periodic_size - 1),
2019                         stream->interval, hc32_to_cpu(ehci, stream->splits));
2020         }
2021         ehci_to_hcd(ehci)->self.bandwidth_isoc_reqs++;
2022
2023         /* fill sITDs frame by frame */
2024         for (packet = 0, sitd = NULL;
2025                         packet < urb->number_of_packets;
2026                         packet++) {
2027
2028                 /* ASSERT:  we have all necessary sitds */
2029                 BUG_ON (list_empty (&sched->td_list));
2030
2031                 /* ASSERT:  no itds for this endpoint in this frame */
2032
2033                 sitd = list_entry (sched->td_list.next,
2034                                 struct ehci_sitd, sitd_list);
2035                 list_move_tail (&sitd->sitd_list, &stream->td_list);
2036                 sitd->stream = iso_stream_get (stream);
2037                 sitd->urb = urb;
2038
2039                 sitd_patch(ehci, stream, sitd, sched, packet);
2040                 sitd_link(ehci, (next_uframe >> 3) & (ehci->periodic_size - 1),
2041                                 sitd);
2042
2043                 next_uframe += stream->interval << 3;
2044         }
2045         stream->next_uframe = next_uframe & (mod - 1);
2046
2047         /* don't need that schedule data any more */
2048         iso_sched_free (stream, sched);
2049         urb->hcpriv = NULL;
2050
2051         timer_action (ehci, TIMER_IO_WATCHDOG);
2052         return enable_periodic(ehci);
2053 }
2054
2055 /*-------------------------------------------------------------------------*/
2056
2057 #define SITD_ERRS (SITD_STS_ERR | SITD_STS_DBE | SITD_STS_BABBLE \
2058                                 | SITD_STS_XACT | SITD_STS_MMF)
2059
2060 /* Process and recycle a completed SITD.  Return true iff its urb completed,
2061  * and hence its completion callback probably added things to the hardware
2062  * schedule.
2063  *
2064  * Note that we carefully avoid recycling this descriptor until after any
2065  * completion callback runs, so that it won't be reused quickly.  That is,
2066  * assuming (a) no more than two urbs per frame on this endpoint, and also
2067  * (b) only this endpoint's completions submit URBs.  It seems some silicon
2068  * corrupts things if you reuse completed descriptors very quickly...
2069  */
2070 static unsigned
2071 sitd_complete (
2072         struct ehci_hcd         *ehci,
2073         struct ehci_sitd        *sitd
2074 ) {
2075         struct urb                              *urb = sitd->urb;
2076         struct usb_iso_packet_descriptor        *desc;
2077         u32                                     t;
2078         int                                     urb_index = -1;
2079         struct ehci_iso_stream                  *stream = sitd->stream;
2080         struct usb_device                       *dev;
2081         unsigned                                retval = false;
2082
2083         urb_index = sitd->index;
2084         desc = &urb->iso_frame_desc [urb_index];
2085         t = hc32_to_cpup(ehci, &sitd->hw_results);
2086
2087         /* report transfer status */
2088         if (t & SITD_ERRS) {
2089                 urb->error_count++;
2090                 if (t & SITD_STS_DBE)
2091                         desc->status = usb_pipein (urb->pipe)
2092                                 ? -ENOSR  /* hc couldn't read */
2093                                 : -ECOMM; /* hc couldn't write */
2094                 else if (t & SITD_STS_BABBLE)
2095                         desc->status = -EOVERFLOW;
2096                 else /* XACT, MMF, etc */
2097                         desc->status = -EPROTO;
2098         } else {
2099                 desc->status = 0;
2100                 desc->actual_length = desc->length - SITD_LENGTH(t);
2101                 urb->actual_length += desc->actual_length;
2102         }
2103
2104         /* handle completion now? */
2105         if ((urb_index + 1) != urb->number_of_packets)
2106                 goto done;
2107
2108         /* ASSERT: it's really the last sitd for this urb
2109         list_for_each_entry (sitd, &stream->td_list, sitd_list)
2110                 BUG_ON (sitd->urb == urb);
2111          */
2112
2113         /* give urb back to the driver; completion often (re)submits */
2114         dev = urb->dev;
2115         ehci_urb_done(ehci, urb, 0);
2116         retval = true;
2117         urb = NULL;
2118         (void) disable_periodic(ehci);
2119         ehci_to_hcd(ehci)->self.bandwidth_isoc_reqs--;
2120
2121         if (list_is_singular(&stream->td_list)) {
2122                 ehci_to_hcd(ehci)->self.bandwidth_allocated
2123                                 -= stream->bandwidth;
2124                 ehci_vdbg (ehci,
2125                         "deschedule devp %s ep%d%s-iso\n",
2126                         dev->devpath, stream->bEndpointAddress & 0x0f,
2127                         (stream->bEndpointAddress & USB_DIR_IN) ? "in" : "out");
2128         }
2129         iso_stream_put (ehci, stream);
2130
2131 done:
2132         sitd->urb = NULL;
2133         if (ehci->clock_frame != sitd->frame) {
2134                 /* OK to recycle this SITD now. */
2135                 sitd->stream = NULL;
2136                 list_move(&sitd->sitd_list, &stream->free_list);
2137                 iso_stream_put(ehci, stream);
2138         } else {
2139                 /* HW might remember this SITD, so we can't recycle it yet.
2140                  * Move it to a safe place until a new frame starts.
2141                  */
2142                 list_move(&sitd->sitd_list, &ehci->cached_sitd_list);
2143                 if (stream->refcount == 2) {
2144                         /* If iso_stream_put() were called here, stream
2145                          * would be freed.  Instead, just prevent reuse.
2146                          */
2147                         stream->ep->hcpriv = NULL;
2148                         stream->ep = NULL;
2149                 }
2150         }
2151         return retval;
2152 }
2153
2154
2155 static int sitd_submit (struct ehci_hcd *ehci, struct urb *urb,
2156         gfp_t mem_flags)
2157 {
2158         int                     status = -EINVAL;
2159         unsigned long           flags;
2160         struct ehci_iso_stream  *stream;
2161
2162         /* Get iso_stream head */
2163         stream = iso_stream_find (ehci, urb);
2164         if (stream == NULL) {
2165                 ehci_dbg (ehci, "can't get iso stream\n");
2166                 return -ENOMEM;
2167         }
2168         if (urb->interval != stream->interval) {
2169                 ehci_dbg (ehci, "can't change iso interval %d --> %d\n",
2170                         stream->interval, urb->interval);
2171                 goto done;
2172         }
2173
2174 #ifdef EHCI_URB_TRACE
2175         ehci_dbg (ehci,
2176                 "submit %p dev%s ep%d%s-iso len %d\n",
2177                 urb, urb->dev->devpath,
2178                 usb_pipeendpoint (urb->pipe),
2179                 usb_pipein (urb->pipe) ? "in" : "out",
2180                 urb->transfer_buffer_length);
2181 #endif
2182
2183         /* allocate SITDs */
2184         status = sitd_urb_transaction (stream, ehci, urb, mem_flags);
2185         if (status < 0) {
2186                 ehci_dbg (ehci, "can't init sitds\n");
2187                 goto done;
2188         }
2189
2190         /* schedule ... need to lock */
2191         spin_lock_irqsave (&ehci->lock, flags);
2192         if (unlikely(!HCD_HW_ACCESSIBLE(ehci_to_hcd(ehci)))) {
2193                 status = -ESHUTDOWN;
2194                 goto done_not_linked;
2195         }
2196         status = usb_hcd_link_urb_to_ep(ehci_to_hcd(ehci), urb);
2197         if (unlikely(status))
2198                 goto done_not_linked;
2199         status = iso_stream_schedule(ehci, urb, stream);
2200         if (status == 0)
2201                 sitd_link_urb (ehci, urb, ehci->periodic_size << 3, stream);
2202         else
2203                 usb_hcd_unlink_urb_from_ep(ehci_to_hcd(ehci), urb);
2204 done_not_linked:
2205         spin_unlock_irqrestore (&ehci->lock, flags);
2206
2207 done:
2208         if (status < 0)
2209                 iso_stream_put (ehci, stream);
2210         return status;
2211 }
2212
2213 /*-------------------------------------------------------------------------*/
2214
2215 static void free_cached_lists(struct ehci_hcd *ehci)
2216 {
2217         struct ehci_itd *itd, *n;
2218         struct ehci_sitd *sitd, *sn;
2219
2220         list_for_each_entry_safe(itd, n, &ehci->cached_itd_list, itd_list) {
2221                 struct ehci_iso_stream  *stream = itd->stream;
2222                 itd->stream = NULL;
2223                 list_move(&itd->itd_list, &stream->free_list);
2224                 iso_stream_put(ehci, stream);
2225         }
2226
2227         list_for_each_entry_safe(sitd, sn, &ehci->cached_sitd_list, sitd_list) {
2228                 struct ehci_iso_stream  *stream = sitd->stream;
2229                 sitd->stream = NULL;
2230                 list_move(&sitd->sitd_list, &stream->free_list);
2231                 iso_stream_put(ehci, stream);
2232         }
2233 }
2234
2235 /*-------------------------------------------------------------------------*/
2236
2237 static void
2238 scan_periodic (struct ehci_hcd *ehci)
2239 {
2240         unsigned        now_uframe, frame, clock, clock_frame, mod;
2241         unsigned        modified;
2242
2243         mod = ehci->periodic_size << 3;
2244
2245         /*
2246          * When running, scan from last scan point up to "now"
2247          * else clean up by scanning everything that's left.
2248          * Touches as few pages as possible:  cache-friendly.
2249          */
2250         now_uframe = ehci->next_uframe;
2251         if (HC_IS_RUNNING(ehci_to_hcd(ehci)->state)) {
2252                 clock = ehci_readl(ehci, &ehci->regs->frame_index);
2253                 clock_frame = (clock >> 3) & (ehci->periodic_size - 1);
2254         } else  {
2255                 clock = now_uframe + mod - 1;
2256                 clock_frame = -1;
2257         }
2258         if (ehci->clock_frame != clock_frame) {
2259                 free_cached_lists(ehci);
2260                 ehci->clock_frame = clock_frame;
2261         }
2262         clock &= mod - 1;
2263         clock_frame = clock >> 3;
2264
2265         for (;;) {
2266                 union ehci_shadow       q, *q_p;
2267                 __hc32                  type, *hw_p;
2268                 unsigned                incomplete = false;
2269
2270                 frame = now_uframe >> 3;
2271
2272 restart:
2273                 /* scan each element in frame's queue for completions */
2274                 q_p = &ehci->pshadow [frame];
2275                 hw_p = &ehci->periodic [frame];
2276                 q.ptr = q_p->ptr;
2277                 type = Q_NEXT_TYPE(ehci, *hw_p);
2278                 modified = 0;
2279
2280                 while (q.ptr != NULL) {
2281                         unsigned                uf;
2282                         union ehci_shadow       temp;
2283                         int                     live;
2284
2285                         live = HC_IS_RUNNING (ehci_to_hcd(ehci)->state);
2286                         switch (hc32_to_cpu(ehci, type)) {
2287                         case Q_TYPE_QH:
2288                                 /* handle any completions */
2289                                 temp.qh = qh_get (q.qh);
2290                                 type = Q_NEXT_TYPE(ehci, q.qh->hw->hw_next);
2291                                 q = q.qh->qh_next;
2292                                 modified = qh_completions (ehci, temp.qh);
2293                                 if (unlikely(list_empty(&temp.qh->qtd_list) ||
2294                                                 temp.qh->needs_rescan))
2295                                         intr_deschedule (ehci, temp.qh);
2296                                 qh_put (temp.qh);
2297                                 break;
2298                         case Q_TYPE_FSTN:
2299                                 /* for "save place" FSTNs, look at QH entries
2300                                  * in the previous frame for completions.
2301                                  */
2302                                 if (q.fstn->hw_prev != EHCI_LIST_END(ehci)) {
2303                                         dbg ("ignoring completions from FSTNs");
2304                                 }
2305                                 type = Q_NEXT_TYPE(ehci, q.fstn->hw_next);
2306                                 q = q.fstn->fstn_next;
2307                                 break;
2308                         case Q_TYPE_ITD:
2309                                 /* If this ITD is still active, leave it for
2310                                  * later processing ... check the next entry.
2311                                  * No need to check for activity unless the
2312                                  * frame is current.
2313                                  */
2314                                 if (frame == clock_frame && live) {
2315                                         rmb();
2316                                         for (uf = 0; uf < 8; uf++) {
2317                                                 if (q.itd->hw_transaction[uf] &
2318                                                             ITD_ACTIVE(ehci))
2319                                                         break;
2320                                         }
2321                                         if (uf < 8) {
2322                                                 incomplete = true;
2323                                                 q_p = &q.itd->itd_next;
2324                                                 hw_p = &q.itd->hw_next;
2325                                                 type = Q_NEXT_TYPE(ehci,
2326                                                         q.itd->hw_next);
2327                                                 q = *q_p;
2328                                                 break;
2329                                         }
2330                                 }
2331
2332                                 /* Take finished ITDs out of the schedule
2333                                  * and process them:  recycle, maybe report
2334                                  * URB completion.  HC won't cache the
2335                                  * pointer for much longer, if at all.
2336                                  */
2337                                 *q_p = q.itd->itd_next;
2338                                 *hw_p = q.itd->hw_next;
2339                                 type = Q_NEXT_TYPE(ehci, q.itd->hw_next);
2340                                 wmb();
2341                                 modified = itd_complete (ehci, q.itd);
2342                                 q = *q_p;
2343                                 break;
2344                         case Q_TYPE_SITD:
2345                                 /* If this SITD is still active, leave it for
2346                                  * later processing ... check the next entry.
2347                                  * No need to check for activity unless the
2348                                  * frame is current.
2349                                  */
2350                                 if (((frame == clock_frame) ||
2351                                      (((frame + 1) & (ehci->periodic_size - 1))
2352                                       == clock_frame))
2353                                     && live
2354                                     && (q.sitd->hw_results &
2355                                         SITD_ACTIVE(ehci))) {
2356
2357                                         incomplete = true;
2358                                         q_p = &q.sitd->sitd_next;
2359                                         hw_p = &q.sitd->hw_next;
2360                                         type = Q_NEXT_TYPE(ehci,
2361                                                         q.sitd->hw_next);
2362                                         q = *q_p;
2363                                         break;
2364                                 }
2365
2366                                 /* Take finished SITDs out of the schedule
2367                                  * and process them:  recycle, maybe report
2368                                  * URB completion.
2369                                  */
2370                                 *q_p = q.sitd->sitd_next;
2371                                 *hw_p = q.sitd->hw_next;
2372                                 type = Q_NEXT_TYPE(ehci, q.sitd->hw_next);
2373                                 wmb();
2374                                 modified = sitd_complete (ehci, q.sitd);
2375                                 q = *q_p;
2376                                 break;
2377                         default:
2378                                 dbg ("corrupt type %d frame %d shadow %p",
2379                                         type, frame, q.ptr);
2380                                 // BUG ();
2381                                 q.ptr = NULL;
2382                         }
2383
2384                         /* assume completion callbacks modify the queue */
2385                         if (unlikely (modified)) {
2386                                 if (likely(ehci->periodic_sched > 0))
2387                                         goto restart;
2388                                 /* short-circuit this scan */
2389                                 now_uframe = clock;
2390                                 break;
2391                         }
2392                 }
2393
2394                 /* If we can tell we caught up to the hardware, stop now.
2395                  * We can't advance our scan without collecting the ISO
2396                  * transfers that are still pending in this frame.
2397                  */
2398                 if (incomplete && HC_IS_RUNNING(ehci_to_hcd(ehci)->state)) {
2399                         ehci->next_uframe = now_uframe;
2400                         break;
2401                 }
2402
2403                 // FIXME:  this assumes we won't get lapped when
2404                 // latencies climb; that should be rare, but...
2405                 // detect it, and just go all the way around.
2406                 // FLR might help detect this case, so long as latencies
2407                 // don't exceed periodic_size msec (default 1.024 sec).
2408
2409                 // FIXME:  likewise assumes HC doesn't halt mid-scan
2410
2411                 if (now_uframe == clock) {
2412                         unsigned        now;
2413
2414                         if (!HC_IS_RUNNING (ehci_to_hcd(ehci)->state)
2415                                         || ehci->periodic_sched == 0)
2416                                 break;
2417                         ehci->next_uframe = now_uframe;
2418                         now = ehci_readl(ehci, &ehci->regs->frame_index) &
2419                                         (mod - 1);
2420                         if (now_uframe == now)
2421                                 break;
2422
2423                         /* rescan the rest of this frame, then ... */
2424                         clock = now;
2425                         clock_frame = clock >> 3;
2426                         if (ehci->clock_frame != clock_frame) {
2427                                 free_cached_lists(ehci);
2428                                 ehci->clock_frame = clock_frame;
2429                         }
2430                 } else {
2431                         now_uframe++;
2432                         now_uframe &= mod - 1;
2433                 }
2434         }
2435 }