xref: /openbmc/linux/drivers/usb/musb/musb_host.c (revision e33bbe69149b802c0c77bfb822685772f85388ca)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * MUSB OTG driver host support
4  *
5  * Copyright 2005 Mentor Graphics Corporation
6  * Copyright (C) 2005-2006 by Texas Instruments
7  * Copyright (C) 2006-2007 Nokia Corporation
8  * Copyright (C) 2008-2009 MontaVista Software, Inc. <source@mvista.com>
9  */
10 
11 #include <linux/module.h>
12 #include <linux/kernel.h>
13 #include <linux/delay.h>
14 #include <linux/sched.h>
15 #include <linux/slab.h>
16 #include <linux/errno.h>
17 #include <linux/list.h>
18 #include <linux/dma-mapping.h>
19 
20 #include "musb_core.h"
21 #include "musb_host.h"
22 #include "musb_trace.h"
23 
24 /* MUSB HOST status 22-mar-2006
25  *
26  * - There's still lots of partial code duplication for fault paths, so
27  *   they aren't handled as consistently as they need to be.
28  *
29  * - PIO mostly behaved when last tested.
30  *     + including ep0, with all usbtest cases 9, 10
31  *     + usbtest 14 (ep0out) doesn't seem to run at all
32  *     + double buffered OUT/TX endpoints saw stalls(!) with certain usbtest
33  *       configurations, but otherwise double buffering passes basic tests.
34  *     + for 2.6.N, for N > ~10, needs API changes for hcd framework.
35  *
36  * - DMA (CPPI) ... partially behaves, not currently recommended
37  *     + about 1/15 the speed of typical EHCI implementations (PCI)
38  *     + RX, all too often reqpkt seems to misbehave after tx
39  *     + TX, no known issues (other than evident silicon issue)
40  *
41  * - DMA (Mentor/OMAP) ...has at least toggle update problems
42  *
43  * - [23-feb-2009] minimal traffic scheduling to avoid bulk RX packet
44  *   starvation ... nothing yet for TX, interrupt, or bulk.
45  *
46  * - Not tested with HNP, but some SRP paths seem to behave.
47  *
48  * NOTE 24-August-2006:
49  *
50  * - Bulk traffic finally uses both sides of hardware ep1, freeing up an
51  *   extra endpoint for periodic use enabling hub + keybd + mouse.  That
52  *   mostly works, except that with "usbnet" it's easy to trigger cases
53  *   with "ping" where RX loses.  (a) ping to davinci, even "ping -f",
54  *   fine; but (b) ping _from_ davinci, even "ping -c 1", ICMP RX loses
55  *   although ARP RX wins.  (That test was done with a full speed link.)
56  */
57 
58 
59 /*
60  * NOTE on endpoint usage:
61  *
62  * CONTROL transfers all go through ep0.  BULK ones go through dedicated IN
63  * and OUT endpoints ... hardware is dedicated for those "async" queue(s).
64  * (Yes, bulk _could_ use more of the endpoints than that, and would even
65  * benefit from it.)
66  *
67  * INTERUPPT and ISOCHRONOUS transfers are scheduled to the other endpoints.
68  * So far that scheduling is both dumb and optimistic:  the endpoint will be
69  * "claimed" until its software queue is no longer refilled.  No multiplexing
70  * of transfers between endpoints, or anything clever.
71  */
72 
73 struct musb *hcd_to_musb(struct usb_hcd *hcd)
74 {
75 	return *(struct musb **) hcd->hcd_priv;
76 }
77 
78 
79 static void musb_ep_program(struct musb *musb, u8 epnum,
80 			struct urb *urb, int is_out,
81 			u8 *buf, u32 offset, u32 len);
82 
83 /*
84  * Clear TX fifo. Needed to avoid BABBLE errors.
85  */
86 static void musb_h_tx_flush_fifo(struct musb_hw_ep *ep)
87 {
88 	struct musb	*musb = ep->musb;
89 	void __iomem	*epio = ep->regs;
90 	u16		csr;
91 	int		retries = 1000;
92 
93 	csr = musb_readw(epio, MUSB_TXCSR);
94 	while (csr & MUSB_TXCSR_FIFONOTEMPTY) {
95 		csr |= MUSB_TXCSR_FLUSHFIFO | MUSB_TXCSR_TXPKTRDY;
96 		musb_writew(epio, MUSB_TXCSR, csr);
97 		csr = musb_readw(epio, MUSB_TXCSR);
98 
99 		/*
100 		 * FIXME: sometimes the tx fifo flush failed, it has been
101 		 * observed during device disconnect on AM335x.
102 		 *
103 		 * To reproduce the issue, ensure tx urb(s) are queued when
104 		 * unplug the usb device which is connected to AM335x usb
105 		 * host port.
106 		 *
107 		 * I found using a usb-ethernet device and running iperf
108 		 * (client on AM335x) has very high chance to trigger it.
109 		 *
110 		 * Better to turn on musb_dbg() in musb_cleanup_urb() with
111 		 * CPPI enabled to see the issue when aborting the tx channel.
112 		 */
113 		if (dev_WARN_ONCE(musb->controller, retries-- < 1,
114 				"Could not flush host TX%d fifo: csr: %04x\n",
115 				ep->epnum, csr))
116 			return;
117 		mdelay(1);
118 	}
119 }
120 
121 static void musb_h_ep0_flush_fifo(struct musb_hw_ep *ep)
122 {
123 	void __iomem	*epio = ep->regs;
124 	u16		csr;
125 	int		retries = 5;
126 
127 	/* scrub any data left in the fifo */
128 	do {
129 		csr = musb_readw(epio, MUSB_TXCSR);
130 		if (!(csr & (MUSB_CSR0_TXPKTRDY | MUSB_CSR0_RXPKTRDY)))
131 			break;
132 		musb_writew(epio, MUSB_TXCSR, MUSB_CSR0_FLUSHFIFO);
133 		csr = musb_readw(epio, MUSB_TXCSR);
134 		udelay(10);
135 	} while (--retries);
136 
137 	WARN(!retries, "Could not flush host TX%d fifo: csr: %04x\n",
138 			ep->epnum, csr);
139 
140 	/* and reset for the next transfer */
141 	musb_writew(epio, MUSB_TXCSR, 0);
142 }
143 
144 /*
145  * Start transmit. Caller is responsible for locking shared resources.
146  * musb must be locked.
147  */
148 static inline void musb_h_tx_start(struct musb_hw_ep *ep)
149 {
150 	u16	txcsr;
151 
152 	/* NOTE: no locks here; caller should lock and select EP */
153 	if (ep->epnum) {
154 		txcsr = musb_readw(ep->regs, MUSB_TXCSR);
155 		txcsr |= MUSB_TXCSR_TXPKTRDY | MUSB_TXCSR_H_WZC_BITS;
156 		musb_writew(ep->regs, MUSB_TXCSR, txcsr);
157 	} else {
158 		txcsr = MUSB_CSR0_H_SETUPPKT | MUSB_CSR0_TXPKTRDY;
159 		musb_writew(ep->regs, MUSB_CSR0, txcsr);
160 	}
161 
162 }
163 
164 static inline void musb_h_tx_dma_start(struct musb_hw_ep *ep)
165 {
166 	u16	txcsr;
167 
168 	/* NOTE: no locks here; caller should lock and select EP */
169 	txcsr = musb_readw(ep->regs, MUSB_TXCSR);
170 	txcsr |= MUSB_TXCSR_DMAENAB | MUSB_TXCSR_H_WZC_BITS;
171 	if (is_cppi_enabled(ep->musb))
172 		txcsr |= MUSB_TXCSR_DMAMODE;
173 	musb_writew(ep->regs, MUSB_TXCSR, txcsr);
174 }
175 
176 static void musb_ep_set_qh(struct musb_hw_ep *ep, int is_in, struct musb_qh *qh)
177 {
178 	if (is_in != 0 || ep->is_shared_fifo)
179 		ep->in_qh  = qh;
180 	if (is_in == 0 || ep->is_shared_fifo)
181 		ep->out_qh = qh;
182 }
183 
184 static struct musb_qh *musb_ep_get_qh(struct musb_hw_ep *ep, int is_in)
185 {
186 	return is_in ? ep->in_qh : ep->out_qh;
187 }
188 
189 /*
190  * Start the URB at the front of an endpoint's queue
191  * end must be claimed from the caller.
192  *
193  * Context: controller locked, irqs blocked
194  */
195 static void
196 musb_start_urb(struct musb *musb, int is_in, struct musb_qh *qh)
197 {
198 	u32			len;
199 	void __iomem		*mbase =  musb->mregs;
200 	struct urb		*urb = next_urb(qh);
201 	void			*buf = urb->transfer_buffer;
202 	u32			offset = 0;
203 	struct musb_hw_ep	*hw_ep = qh->hw_ep;
204 	int			epnum = hw_ep->epnum;
205 
206 	/* initialize software qh state */
207 	qh->offset = 0;
208 	qh->segsize = 0;
209 
210 	/* gather right source of data */
211 	switch (qh->type) {
212 	case USB_ENDPOINT_XFER_CONTROL:
213 		/* control transfers always start with SETUP */
214 		is_in = 0;
215 		musb->ep0_stage = MUSB_EP0_START;
216 		buf = urb->setup_packet;
217 		len = 8;
218 		break;
219 	case USB_ENDPOINT_XFER_ISOC:
220 		qh->iso_idx = 0;
221 		qh->frame = 0;
222 		offset = urb->iso_frame_desc[0].offset;
223 		len = urb->iso_frame_desc[0].length;
224 		break;
225 	default:		/* bulk, interrupt */
226 		/* actual_length may be nonzero on retry paths */
227 		buf = urb->transfer_buffer + urb->actual_length;
228 		len = urb->transfer_buffer_length - urb->actual_length;
229 	}
230 
231 	trace_musb_urb_start(musb, urb);
232 
233 	/* Configure endpoint */
234 	musb_ep_set_qh(hw_ep, is_in, qh);
235 	musb_ep_program(musb, epnum, urb, !is_in, buf, offset, len);
236 
237 	/* transmit may have more work: start it when it is time */
238 	if (is_in)
239 		return;
240 
241 	/* determine if the time is right for a periodic transfer */
242 	switch (qh->type) {
243 	case USB_ENDPOINT_XFER_ISOC:
244 	case USB_ENDPOINT_XFER_INT:
245 		musb_dbg(musb, "check whether there's still time for periodic Tx");
246 		/* FIXME this doesn't implement that scheduling policy ...
247 		 * or handle framecounter wrapping
248 		 */
249 		if (1) {	/* Always assume URB_ISO_ASAP */
250 			/* REVISIT the SOF irq handler shouldn't duplicate
251 			 * this code; and we don't init urb->start_frame...
252 			 */
253 			qh->frame = 0;
254 			goto start;
255 		} else {
256 			qh->frame = urb->start_frame;
257 			/* enable SOF interrupt so we can count down */
258 			musb_dbg(musb, "SOF for %d", epnum);
259 #if 1 /* ifndef	CONFIG_ARCH_DAVINCI */
260 			musb_writeb(mbase, MUSB_INTRUSBE, 0xff);
261 #endif
262 		}
263 		break;
264 	default:
265 start:
266 		musb_dbg(musb, "Start TX%d %s", epnum,
267 			hw_ep->tx_channel ? "dma" : "pio");
268 
269 		if (!hw_ep->tx_channel)
270 			musb_h_tx_start(hw_ep);
271 		else if (is_cppi_enabled(musb) || tusb_dma_omap(musb))
272 			musb_h_tx_dma_start(hw_ep);
273 	}
274 }
275 
276 /* Context: caller owns controller lock, IRQs are blocked */
277 static void musb_giveback(struct musb *musb, struct urb *urb, int status)
278 __releases(musb->lock)
279 __acquires(musb->lock)
280 {
281 	trace_musb_urb_gb(musb, urb);
282 
283 	usb_hcd_unlink_urb_from_ep(musb->hcd, urb);
284 	spin_unlock(&musb->lock);
285 	usb_hcd_giveback_urb(musb->hcd, urb, status);
286 	spin_lock(&musb->lock);
287 }
288 
289 /* For bulk/interrupt endpoints only */
290 static inline void musb_save_toggle(struct musb_qh *qh, int is_in,
291 				    struct urb *urb)
292 {
293 	void __iomem		*epio = qh->hw_ep->regs;
294 	u16			csr;
295 
296 	/*
297 	 * FIXME: the current Mentor DMA code seems to have
298 	 * problems getting toggle correct.
299 	 */
300 
301 	if (is_in)
302 		csr = musb_readw(epio, MUSB_RXCSR) & MUSB_RXCSR_H_DATATOGGLE;
303 	else
304 		csr = musb_readw(epio, MUSB_TXCSR) & MUSB_TXCSR_H_DATATOGGLE;
305 
306 	usb_settoggle(urb->dev, qh->epnum, !is_in, csr ? 1 : 0);
307 }
308 
309 /*
310  * Advance this hardware endpoint's queue, completing the specified URB and
311  * advancing to either the next URB queued to that qh, or else invalidating
312  * that qh and advancing to the next qh scheduled after the current one.
313  *
314  * Context: caller owns controller lock, IRQs are blocked
315  */
316 static void musb_advance_schedule(struct musb *musb, struct urb *urb,
317 				  struct musb_hw_ep *hw_ep, int is_in)
318 {
319 	struct musb_qh		*qh = musb_ep_get_qh(hw_ep, is_in);
320 	struct musb_hw_ep	*ep = qh->hw_ep;
321 	int			ready = qh->is_ready;
322 	int			status;
323 
324 	status = (urb->status == -EINPROGRESS) ? 0 : urb->status;
325 
326 	/* save toggle eagerly, for paranoia */
327 	switch (qh->type) {
328 	case USB_ENDPOINT_XFER_BULK:
329 	case USB_ENDPOINT_XFER_INT:
330 		musb_save_toggle(qh, is_in, urb);
331 		break;
332 	case USB_ENDPOINT_XFER_ISOC:
333 		if (status == 0 && urb->error_count)
334 			status = -EXDEV;
335 		break;
336 	}
337 
338 	qh->is_ready = 0;
339 	musb_giveback(musb, urb, status);
340 	qh->is_ready = ready;
341 
342 	/* reclaim resources (and bandwidth) ASAP; deschedule it, and
343 	 * invalidate qh as soon as list_empty(&hep->urb_list)
344 	 */
345 	if (list_empty(&qh->hep->urb_list)) {
346 		struct list_head	*head;
347 		struct dma_controller	*dma = musb->dma_controller;
348 
349 		if (is_in) {
350 			ep->rx_reinit = 1;
351 			if (ep->rx_channel) {
352 				dma->channel_release(ep->rx_channel);
353 				ep->rx_channel = NULL;
354 			}
355 		} else {
356 			ep->tx_reinit = 1;
357 			if (ep->tx_channel) {
358 				dma->channel_release(ep->tx_channel);
359 				ep->tx_channel = NULL;
360 			}
361 		}
362 
363 		/* Clobber old pointers to this qh */
364 		musb_ep_set_qh(ep, is_in, NULL);
365 		qh->hep->hcpriv = NULL;
366 
367 		switch (qh->type) {
368 
369 		case USB_ENDPOINT_XFER_CONTROL:
370 		case USB_ENDPOINT_XFER_BULK:
371 			/* fifo policy for these lists, except that NAKing
372 			 * should rotate a qh to the end (for fairness).
373 			 */
374 			if (qh->mux == 1) {
375 				head = qh->ring.prev;
376 				list_del(&qh->ring);
377 				kfree(qh);
378 				qh = first_qh(head);
379 				break;
380 			}
381 
382 		case USB_ENDPOINT_XFER_ISOC:
383 		case USB_ENDPOINT_XFER_INT:
384 			/* this is where periodic bandwidth should be
385 			 * de-allocated if it's tracked and allocated;
386 			 * and where we'd update the schedule tree...
387 			 */
388 			kfree(qh);
389 			qh = NULL;
390 			break;
391 		}
392 	}
393 
394 	if (qh != NULL && qh->is_ready) {
395 		musb_dbg(musb, "... next ep%d %cX urb %p",
396 		    hw_ep->epnum, is_in ? 'R' : 'T', next_urb(qh));
397 		musb_start_urb(musb, is_in, qh);
398 	}
399 }
400 
401 static u16 musb_h_flush_rxfifo(struct musb_hw_ep *hw_ep, u16 csr)
402 {
403 	/* we don't want fifo to fill itself again;
404 	 * ignore dma (various models),
405 	 * leave toggle alone (may not have been saved yet)
406 	 */
407 	csr |= MUSB_RXCSR_FLUSHFIFO | MUSB_RXCSR_RXPKTRDY;
408 	csr &= ~(MUSB_RXCSR_H_REQPKT
409 		| MUSB_RXCSR_H_AUTOREQ
410 		| MUSB_RXCSR_AUTOCLEAR);
411 
412 	/* write 2x to allow double buffering */
413 	musb_writew(hw_ep->regs, MUSB_RXCSR, csr);
414 	musb_writew(hw_ep->regs, MUSB_RXCSR, csr);
415 
416 	/* flush writebuffer */
417 	return musb_readw(hw_ep->regs, MUSB_RXCSR);
418 }
419 
420 /*
421  * PIO RX for a packet (or part of it).
422  */
423 static bool
424 musb_host_packet_rx(struct musb *musb, struct urb *urb, u8 epnum, u8 iso_err)
425 {
426 	u16			rx_count;
427 	u8			*buf;
428 	u16			csr;
429 	bool			done = false;
430 	u32			length;
431 	int			do_flush = 0;
432 	struct musb_hw_ep	*hw_ep = musb->endpoints + epnum;
433 	void __iomem		*epio = hw_ep->regs;
434 	struct musb_qh		*qh = hw_ep->in_qh;
435 	int			pipe = urb->pipe;
436 	void			*buffer = urb->transfer_buffer;
437 
438 	/* musb_ep_select(mbase, epnum); */
439 	rx_count = musb_readw(epio, MUSB_RXCOUNT);
440 	musb_dbg(musb, "RX%d count %d, buffer %p len %d/%d", epnum, rx_count,
441 			urb->transfer_buffer, qh->offset,
442 			urb->transfer_buffer_length);
443 
444 	/* unload FIFO */
445 	if (usb_pipeisoc(pipe)) {
446 		int					status = 0;
447 		struct usb_iso_packet_descriptor	*d;
448 
449 		if (iso_err) {
450 			status = -EILSEQ;
451 			urb->error_count++;
452 		}
453 
454 		d = urb->iso_frame_desc + qh->iso_idx;
455 		buf = buffer + d->offset;
456 		length = d->length;
457 		if (rx_count > length) {
458 			if (status == 0) {
459 				status = -EOVERFLOW;
460 				urb->error_count++;
461 			}
462 			musb_dbg(musb, "OVERFLOW %d into %d", rx_count, length);
463 			do_flush = 1;
464 		} else
465 			length = rx_count;
466 		urb->actual_length += length;
467 		d->actual_length = length;
468 
469 		d->status = status;
470 
471 		/* see if we are done */
472 		done = (++qh->iso_idx >= urb->number_of_packets);
473 	} else {
474 		/* non-isoch */
475 		buf = buffer + qh->offset;
476 		length = urb->transfer_buffer_length - qh->offset;
477 		if (rx_count > length) {
478 			if (urb->status == -EINPROGRESS)
479 				urb->status = -EOVERFLOW;
480 			musb_dbg(musb, "OVERFLOW %d into %d", rx_count, length);
481 			do_flush = 1;
482 		} else
483 			length = rx_count;
484 		urb->actual_length += length;
485 		qh->offset += length;
486 
487 		/* see if we are done */
488 		done = (urb->actual_length == urb->transfer_buffer_length)
489 			|| (rx_count < qh->maxpacket)
490 			|| (urb->status != -EINPROGRESS);
491 		if (done
492 				&& (urb->status == -EINPROGRESS)
493 				&& (urb->transfer_flags & URB_SHORT_NOT_OK)
494 				&& (urb->actual_length
495 					< urb->transfer_buffer_length))
496 			urb->status = -EREMOTEIO;
497 	}
498 
499 	musb_read_fifo(hw_ep, length, buf);
500 
501 	csr = musb_readw(epio, MUSB_RXCSR);
502 	csr |= MUSB_RXCSR_H_WZC_BITS;
503 	if (unlikely(do_flush))
504 		musb_h_flush_rxfifo(hw_ep, csr);
505 	else {
506 		/* REVISIT this assumes AUTOCLEAR is never set */
507 		csr &= ~(MUSB_RXCSR_RXPKTRDY | MUSB_RXCSR_H_REQPKT);
508 		if (!done)
509 			csr |= MUSB_RXCSR_H_REQPKT;
510 		musb_writew(epio, MUSB_RXCSR, csr);
511 	}
512 
513 	return done;
514 }
515 
516 /* we don't always need to reinit a given side of an endpoint...
517  * when we do, use tx/rx reinit routine and then construct a new CSR
518  * to address data toggle, NYET, and DMA or PIO.
519  *
520  * it's possible that driver bugs (especially for DMA) or aborting a
521  * transfer might have left the endpoint busier than it should be.
522  * the busy/not-empty tests are basically paranoia.
523  */
524 static void
525 musb_rx_reinit(struct musb *musb, struct musb_qh *qh, u8 epnum)
526 {
527 	struct musb_hw_ep *ep = musb->endpoints + epnum;
528 	u16	csr;
529 
530 	/* NOTE:  we know the "rx" fifo reinit never triggers for ep0.
531 	 * That always uses tx_reinit since ep0 repurposes TX register
532 	 * offsets; the initial SETUP packet is also a kind of OUT.
533 	 */
534 
535 	/* if programmed for Tx, put it in RX mode */
536 	if (ep->is_shared_fifo) {
537 		csr = musb_readw(ep->regs, MUSB_TXCSR);
538 		if (csr & MUSB_TXCSR_MODE) {
539 			musb_h_tx_flush_fifo(ep);
540 			csr = musb_readw(ep->regs, MUSB_TXCSR);
541 			musb_writew(ep->regs, MUSB_TXCSR,
542 				    csr | MUSB_TXCSR_FRCDATATOG);
543 		}
544 
545 		/*
546 		 * Clear the MODE bit (and everything else) to enable Rx.
547 		 * NOTE: we mustn't clear the DMAMODE bit before DMAENAB.
548 		 */
549 		if (csr & MUSB_TXCSR_DMAMODE)
550 			musb_writew(ep->regs, MUSB_TXCSR, MUSB_TXCSR_DMAMODE);
551 		musb_writew(ep->regs, MUSB_TXCSR, 0);
552 
553 	/* scrub all previous state, clearing toggle */
554 	}
555 	csr = musb_readw(ep->regs, MUSB_RXCSR);
556 	if (csr & MUSB_RXCSR_RXPKTRDY)
557 		WARNING("rx%d, packet/%d ready?\n", ep->epnum,
558 			musb_readw(ep->regs, MUSB_RXCOUNT));
559 
560 	musb_h_flush_rxfifo(ep, MUSB_RXCSR_CLRDATATOG);
561 
562 	/* target addr and (for multipoint) hub addr/port */
563 	if (musb->is_multipoint) {
564 		musb_write_rxfunaddr(musb, epnum, qh->addr_reg);
565 		musb_write_rxhubaddr(musb, epnum, qh->h_addr_reg);
566 		musb_write_rxhubport(musb, epnum, qh->h_port_reg);
567 	} else
568 		musb_writeb(musb->mregs, MUSB_FADDR, qh->addr_reg);
569 
570 	/* protocol/endpoint, interval/NAKlimit, i/o size */
571 	musb_writeb(ep->regs, MUSB_RXTYPE, qh->type_reg);
572 	musb_writeb(ep->regs, MUSB_RXINTERVAL, qh->intv_reg);
573 	/* NOTE: bulk combining rewrites high bits of maxpacket */
574 	/* Set RXMAXP with the FIFO size of the endpoint
575 	 * to disable double buffer mode.
576 	 */
577 	musb_writew(ep->regs, MUSB_RXMAXP,
578 			qh->maxpacket | ((qh->hb_mult - 1) << 11));
579 
580 	ep->rx_reinit = 0;
581 }
582 
583 static void musb_tx_dma_set_mode_mentor(struct dma_controller *dma,
584 		struct musb_hw_ep *hw_ep, struct musb_qh *qh,
585 		struct urb *urb, u32 offset,
586 		u32 *length, u8 *mode)
587 {
588 	struct dma_channel	*channel = hw_ep->tx_channel;
589 	void __iomem		*epio = hw_ep->regs;
590 	u16			pkt_size = qh->maxpacket;
591 	u16			csr;
592 
593 	if (*length > channel->max_len)
594 		*length = channel->max_len;
595 
596 	csr = musb_readw(epio, MUSB_TXCSR);
597 	if (*length > pkt_size) {
598 		*mode = 1;
599 		csr |= MUSB_TXCSR_DMAMODE | MUSB_TXCSR_DMAENAB;
600 		/* autoset shouldn't be set in high bandwidth */
601 		/*
602 		 * Enable Autoset according to table
603 		 * below
604 		 * bulk_split hb_mult	Autoset_Enable
605 		 *	0	1	Yes(Normal)
606 		 *	0	>1	No(High BW ISO)
607 		 *	1	1	Yes(HS bulk)
608 		 *	1	>1	Yes(FS bulk)
609 		 */
610 		if (qh->hb_mult == 1 || (qh->hb_mult > 1 &&
611 					can_bulk_split(hw_ep->musb, qh->type)))
612 			csr |= MUSB_TXCSR_AUTOSET;
613 	} else {
614 		*mode = 0;
615 		csr &= ~(MUSB_TXCSR_AUTOSET | MUSB_TXCSR_DMAMODE);
616 		csr |= MUSB_TXCSR_DMAENAB; /* against programmer's guide */
617 	}
618 	channel->desired_mode = *mode;
619 	musb_writew(epio, MUSB_TXCSR, csr);
620 }
621 
622 static void musb_tx_dma_set_mode_cppi_tusb(struct dma_controller *dma,
623 					   struct musb_hw_ep *hw_ep,
624 					   struct musb_qh *qh,
625 					   struct urb *urb,
626 					   u32 offset,
627 					   u32 *length,
628 					   u8 *mode)
629 {
630 	struct dma_channel *channel = hw_ep->tx_channel;
631 
632 	channel->actual_len = 0;
633 
634 	/*
635 	 * TX uses "RNDIS" mode automatically but needs help
636 	 * to identify the zero-length-final-packet case.
637 	 */
638 	*mode = (urb->transfer_flags & URB_ZERO_PACKET) ? 1 : 0;
639 }
640 
641 static bool musb_tx_dma_program(struct dma_controller *dma,
642 		struct musb_hw_ep *hw_ep, struct musb_qh *qh,
643 		struct urb *urb, u32 offset, u32 length)
644 {
645 	struct dma_channel	*channel = hw_ep->tx_channel;
646 	u16			pkt_size = qh->maxpacket;
647 	u8			mode;
648 
649 	if (musb_dma_inventra(hw_ep->musb) || musb_dma_ux500(hw_ep->musb))
650 		musb_tx_dma_set_mode_mentor(dma, hw_ep, qh, urb, offset,
651 					    &length, &mode);
652 	else if (is_cppi_enabled(hw_ep->musb) || tusb_dma_omap(hw_ep->musb))
653 		musb_tx_dma_set_mode_cppi_tusb(dma, hw_ep, qh, urb, offset,
654 					       &length, &mode);
655 	else
656 		return false;
657 
658 	qh->segsize = length;
659 
660 	/*
661 	 * Ensure the data reaches to main memory before starting
662 	 * DMA transfer
663 	 */
664 	wmb();
665 
666 	if (!dma->channel_program(channel, pkt_size, mode,
667 			urb->transfer_dma + offset, length)) {
668 		void __iomem *epio = hw_ep->regs;
669 		u16 csr;
670 
671 		dma->channel_release(channel);
672 		hw_ep->tx_channel = NULL;
673 
674 		csr = musb_readw(epio, MUSB_TXCSR);
675 		csr &= ~(MUSB_TXCSR_AUTOSET | MUSB_TXCSR_DMAENAB);
676 		musb_writew(epio, MUSB_TXCSR, csr | MUSB_TXCSR_H_WZC_BITS);
677 		return false;
678 	}
679 	return true;
680 }
681 
682 /*
683  * Program an HDRC endpoint as per the given URB
684  * Context: irqs blocked, controller lock held
685  */
686 static void musb_ep_program(struct musb *musb, u8 epnum,
687 			struct urb *urb, int is_out,
688 			u8 *buf, u32 offset, u32 len)
689 {
690 	struct dma_controller	*dma_controller;
691 	struct dma_channel	*dma_channel;
692 	u8			dma_ok;
693 	void __iomem		*mbase = musb->mregs;
694 	struct musb_hw_ep	*hw_ep = musb->endpoints + epnum;
695 	void __iomem		*epio = hw_ep->regs;
696 	struct musb_qh		*qh = musb_ep_get_qh(hw_ep, !is_out);
697 	u16			packet_sz = qh->maxpacket;
698 	u8			use_dma = 1;
699 	u16			csr;
700 
701 	musb_dbg(musb, "%s hw%d urb %p spd%d dev%d ep%d%s "
702 				"h_addr%02x h_port%02x bytes %d",
703 			is_out ? "-->" : "<--",
704 			epnum, urb, urb->dev->speed,
705 			qh->addr_reg, qh->epnum, is_out ? "out" : "in",
706 			qh->h_addr_reg, qh->h_port_reg,
707 			len);
708 
709 	musb_ep_select(mbase, epnum);
710 
711 	if (is_out && !len) {
712 		use_dma = 0;
713 		csr = musb_readw(epio, MUSB_TXCSR);
714 		csr &= ~MUSB_TXCSR_DMAENAB;
715 		musb_writew(epio, MUSB_TXCSR, csr);
716 		hw_ep->tx_channel = NULL;
717 	}
718 
719 	/* candidate for DMA? */
720 	dma_controller = musb->dma_controller;
721 	if (use_dma && is_dma_capable() && epnum && dma_controller) {
722 		dma_channel = is_out ? hw_ep->tx_channel : hw_ep->rx_channel;
723 		if (!dma_channel) {
724 			dma_channel = dma_controller->channel_alloc(
725 					dma_controller, hw_ep, is_out);
726 			if (is_out)
727 				hw_ep->tx_channel = dma_channel;
728 			else
729 				hw_ep->rx_channel = dma_channel;
730 		}
731 	} else
732 		dma_channel = NULL;
733 
734 	/* make sure we clear DMAEnab, autoSet bits from previous run */
735 
736 	/* OUT/transmit/EP0 or IN/receive? */
737 	if (is_out) {
738 		u16	csr;
739 		u16	int_txe;
740 		u16	load_count;
741 
742 		csr = musb_readw(epio, MUSB_TXCSR);
743 
744 		/* disable interrupt in case we flush */
745 		int_txe = musb->intrtxe;
746 		musb_writew(mbase, MUSB_INTRTXE, int_txe & ~(1 << epnum));
747 
748 		/* general endpoint setup */
749 		if (epnum) {
750 			/* flush all old state, set default */
751 			/*
752 			 * We could be flushing valid
753 			 * packets in double buffering
754 			 * case
755 			 */
756 			if (!hw_ep->tx_double_buffered)
757 				musb_h_tx_flush_fifo(hw_ep);
758 
759 			/*
760 			 * We must not clear the DMAMODE bit before or in
761 			 * the same cycle with the DMAENAB bit, so we clear
762 			 * the latter first...
763 			 */
764 			csr &= ~(MUSB_TXCSR_H_NAKTIMEOUT
765 					| MUSB_TXCSR_AUTOSET
766 					| MUSB_TXCSR_DMAENAB
767 					| MUSB_TXCSR_FRCDATATOG
768 					| MUSB_TXCSR_H_RXSTALL
769 					| MUSB_TXCSR_H_ERROR
770 					| MUSB_TXCSR_TXPKTRDY
771 					);
772 			csr |= MUSB_TXCSR_MODE;
773 
774 			if (!hw_ep->tx_double_buffered) {
775 				if (usb_gettoggle(urb->dev, qh->epnum, 1))
776 					csr |= MUSB_TXCSR_H_WR_DATATOGGLE
777 						| MUSB_TXCSR_H_DATATOGGLE;
778 				else
779 					csr |= MUSB_TXCSR_CLRDATATOG;
780 			}
781 
782 			musb_writew(epio, MUSB_TXCSR, csr);
783 			/* REVISIT may need to clear FLUSHFIFO ... */
784 			csr &= ~MUSB_TXCSR_DMAMODE;
785 			musb_writew(epio, MUSB_TXCSR, csr);
786 			csr = musb_readw(epio, MUSB_TXCSR);
787 		} else {
788 			/* endpoint 0: just flush */
789 			musb_h_ep0_flush_fifo(hw_ep);
790 		}
791 
792 		/* target addr and (for multipoint) hub addr/port */
793 		if (musb->is_multipoint) {
794 			musb_write_txfunaddr(musb, epnum, qh->addr_reg);
795 			musb_write_txhubaddr(musb, epnum, qh->h_addr_reg);
796 			musb_write_txhubport(musb, epnum, qh->h_port_reg);
797 /* FIXME if !epnum, do the same for RX ... */
798 		} else
799 			musb_writeb(mbase, MUSB_FADDR, qh->addr_reg);
800 
801 		/* protocol/endpoint/interval/NAKlimit */
802 		if (epnum) {
803 			musb_writeb(epio, MUSB_TXTYPE, qh->type_reg);
804 			if (can_bulk_split(musb, qh->type)) {
805 				qh->hb_mult = hw_ep->max_packet_sz_tx
806 						/ packet_sz;
807 				musb_writew(epio, MUSB_TXMAXP, packet_sz
808 					| ((qh->hb_mult) - 1) << 11);
809 			} else {
810 				musb_writew(epio, MUSB_TXMAXP,
811 						qh->maxpacket |
812 						((qh->hb_mult - 1) << 11));
813 			}
814 			musb_writeb(epio, MUSB_TXINTERVAL, qh->intv_reg);
815 		} else {
816 			musb_writeb(epio, MUSB_NAKLIMIT0, qh->intv_reg);
817 			if (musb->is_multipoint)
818 				musb_writeb(epio, MUSB_TYPE0,
819 						qh->type_reg);
820 		}
821 
822 		if (can_bulk_split(musb, qh->type))
823 			load_count = min((u32) hw_ep->max_packet_sz_tx,
824 						len);
825 		else
826 			load_count = min((u32) packet_sz, len);
827 
828 		if (dma_channel && musb_tx_dma_program(dma_controller,
829 					hw_ep, qh, urb, offset, len))
830 			load_count = 0;
831 
832 		if (load_count) {
833 			/* PIO to load FIFO */
834 			qh->segsize = load_count;
835 			if (!buf) {
836 				sg_miter_start(&qh->sg_miter, urb->sg, 1,
837 						SG_MITER_ATOMIC
838 						| SG_MITER_FROM_SG);
839 				if (!sg_miter_next(&qh->sg_miter)) {
840 					dev_err(musb->controller,
841 							"error: sg"
842 							"list empty\n");
843 					sg_miter_stop(&qh->sg_miter);
844 					goto finish;
845 				}
846 				buf = qh->sg_miter.addr + urb->sg->offset +
847 					urb->actual_length;
848 				load_count = min_t(u32, load_count,
849 						qh->sg_miter.length);
850 				musb_write_fifo(hw_ep, load_count, buf);
851 				qh->sg_miter.consumed = load_count;
852 				sg_miter_stop(&qh->sg_miter);
853 			} else
854 				musb_write_fifo(hw_ep, load_count, buf);
855 		}
856 finish:
857 		/* re-enable interrupt */
858 		musb_writew(mbase, MUSB_INTRTXE, int_txe);
859 
860 	/* IN/receive */
861 	} else {
862 		u16	csr;
863 
864 		if (hw_ep->rx_reinit) {
865 			musb_rx_reinit(musb, qh, epnum);
866 
867 			/* init new state: toggle and NYET, maybe DMA later */
868 			if (usb_gettoggle(urb->dev, qh->epnum, 0))
869 				csr = MUSB_RXCSR_H_WR_DATATOGGLE
870 					| MUSB_RXCSR_H_DATATOGGLE;
871 			else
872 				csr = 0;
873 			if (qh->type == USB_ENDPOINT_XFER_INT)
874 				csr |= MUSB_RXCSR_DISNYET;
875 
876 		} else {
877 			csr = musb_readw(hw_ep->regs, MUSB_RXCSR);
878 
879 			if (csr & (MUSB_RXCSR_RXPKTRDY
880 					| MUSB_RXCSR_DMAENAB
881 					| MUSB_RXCSR_H_REQPKT))
882 				ERR("broken !rx_reinit, ep%d csr %04x\n",
883 						hw_ep->epnum, csr);
884 
885 			/* scrub any stale state, leaving toggle alone */
886 			csr &= MUSB_RXCSR_DISNYET;
887 		}
888 
889 		/* kick things off */
890 
891 		if ((is_cppi_enabled(musb) || tusb_dma_omap(musb)) && dma_channel) {
892 			/* Candidate for DMA */
893 			dma_channel->actual_len = 0L;
894 			qh->segsize = len;
895 
896 			/* AUTOREQ is in a DMA register */
897 			musb_writew(hw_ep->regs, MUSB_RXCSR, csr);
898 			csr = musb_readw(hw_ep->regs, MUSB_RXCSR);
899 
900 			/*
901 			 * Unless caller treats short RX transfers as
902 			 * errors, we dare not queue multiple transfers.
903 			 */
904 			dma_ok = dma_controller->channel_program(dma_channel,
905 					packet_sz, !(urb->transfer_flags &
906 						     URB_SHORT_NOT_OK),
907 					urb->transfer_dma + offset,
908 					qh->segsize);
909 			if (!dma_ok) {
910 				dma_controller->channel_release(dma_channel);
911 				hw_ep->rx_channel = dma_channel = NULL;
912 			} else
913 				csr |= MUSB_RXCSR_DMAENAB;
914 		}
915 
916 		csr |= MUSB_RXCSR_H_REQPKT;
917 		musb_dbg(musb, "RXCSR%d := %04x", epnum, csr);
918 		musb_writew(hw_ep->regs, MUSB_RXCSR, csr);
919 		csr = musb_readw(hw_ep->regs, MUSB_RXCSR);
920 	}
921 }
922 
923 /* Schedule next QH from musb->in_bulk/out_bulk and move the current qh to
924  * the end; avoids starvation for other endpoints.
925  */
926 static void musb_bulk_nak_timeout(struct musb *musb, struct musb_hw_ep *ep,
927 	int is_in)
928 {
929 	struct dma_channel	*dma;
930 	struct urb		*urb;
931 	void __iomem		*mbase = musb->mregs;
932 	void __iomem		*epio = ep->regs;
933 	struct musb_qh		*cur_qh, *next_qh;
934 	u16			rx_csr, tx_csr;
935 
936 	musb_ep_select(mbase, ep->epnum);
937 	if (is_in) {
938 		dma = is_dma_capable() ? ep->rx_channel : NULL;
939 
940 		/*
941 		 * Need to stop the transaction by clearing REQPKT first
942 		 * then the NAK Timeout bit ref MUSBMHDRC USB 2.0 HIGH-SPEED
943 		 * DUAL-ROLE CONTROLLER Programmer's Guide, section 9.2.2
944 		 */
945 		rx_csr = musb_readw(epio, MUSB_RXCSR);
946 		rx_csr |= MUSB_RXCSR_H_WZC_BITS;
947 		rx_csr &= ~MUSB_RXCSR_H_REQPKT;
948 		musb_writew(epio, MUSB_RXCSR, rx_csr);
949 		rx_csr &= ~MUSB_RXCSR_DATAERROR;
950 		musb_writew(epio, MUSB_RXCSR, rx_csr);
951 
952 		cur_qh = first_qh(&musb->in_bulk);
953 	} else {
954 		dma = is_dma_capable() ? ep->tx_channel : NULL;
955 
956 		/* clear nak timeout bit */
957 		tx_csr = musb_readw(epio, MUSB_TXCSR);
958 		tx_csr |= MUSB_TXCSR_H_WZC_BITS;
959 		tx_csr &= ~MUSB_TXCSR_H_NAKTIMEOUT;
960 		musb_writew(epio, MUSB_TXCSR, tx_csr);
961 
962 		cur_qh = first_qh(&musb->out_bulk);
963 	}
964 	if (cur_qh) {
965 		urb = next_urb(cur_qh);
966 		if (dma_channel_status(dma) == MUSB_DMA_STATUS_BUSY) {
967 			dma->status = MUSB_DMA_STATUS_CORE_ABORT;
968 			musb->dma_controller->channel_abort(dma);
969 			urb->actual_length += dma->actual_len;
970 			dma->actual_len = 0L;
971 		}
972 		musb_save_toggle(cur_qh, is_in, urb);
973 
974 		if (is_in) {
975 			/* move cur_qh to end of queue */
976 			list_move_tail(&cur_qh->ring, &musb->in_bulk);
977 
978 			/* get the next qh from musb->in_bulk */
979 			next_qh = first_qh(&musb->in_bulk);
980 
981 			/* set rx_reinit and schedule the next qh */
982 			ep->rx_reinit = 1;
983 		} else {
984 			/* move cur_qh to end of queue */
985 			list_move_tail(&cur_qh->ring, &musb->out_bulk);
986 
987 			/* get the next qh from musb->out_bulk */
988 			next_qh = first_qh(&musb->out_bulk);
989 
990 			/* set tx_reinit and schedule the next qh */
991 			ep->tx_reinit = 1;
992 		}
993 		musb_start_urb(musb, is_in, next_qh);
994 	}
995 }
996 
997 /*
998  * Service the default endpoint (ep0) as host.
999  * Return true until it's time to start the status stage.
1000  */
1001 static bool musb_h_ep0_continue(struct musb *musb, u16 len, struct urb *urb)
1002 {
1003 	bool			 more = false;
1004 	u8			*fifo_dest = NULL;
1005 	u16			fifo_count = 0;
1006 	struct musb_hw_ep	*hw_ep = musb->control_ep;
1007 	struct musb_qh		*qh = hw_ep->in_qh;
1008 	struct usb_ctrlrequest	*request;
1009 
1010 	switch (musb->ep0_stage) {
1011 	case MUSB_EP0_IN:
1012 		fifo_dest = urb->transfer_buffer + urb->actual_length;
1013 		fifo_count = min_t(size_t, len, urb->transfer_buffer_length -
1014 				   urb->actual_length);
1015 		if (fifo_count < len)
1016 			urb->status = -EOVERFLOW;
1017 
1018 		musb_read_fifo(hw_ep, fifo_count, fifo_dest);
1019 
1020 		urb->actual_length += fifo_count;
1021 		if (len < qh->maxpacket) {
1022 			/* always terminate on short read; it's
1023 			 * rarely reported as an error.
1024 			 */
1025 		} else if (urb->actual_length <
1026 				urb->transfer_buffer_length)
1027 			more = true;
1028 		break;
1029 	case MUSB_EP0_START:
1030 		request = (struct usb_ctrlrequest *) urb->setup_packet;
1031 
1032 		if (!request->wLength) {
1033 			musb_dbg(musb, "start no-DATA");
1034 			break;
1035 		} else if (request->bRequestType & USB_DIR_IN) {
1036 			musb_dbg(musb, "start IN-DATA");
1037 			musb->ep0_stage = MUSB_EP0_IN;
1038 			more = true;
1039 			break;
1040 		} else {
1041 			musb_dbg(musb, "start OUT-DATA");
1042 			musb->ep0_stage = MUSB_EP0_OUT;
1043 			more = true;
1044 		}
1045 		/* FALLTHROUGH */
1046 	case MUSB_EP0_OUT:
1047 		fifo_count = min_t(size_t, qh->maxpacket,
1048 				   urb->transfer_buffer_length -
1049 				   urb->actual_length);
1050 		if (fifo_count) {
1051 			fifo_dest = (u8 *) (urb->transfer_buffer
1052 					+ urb->actual_length);
1053 			musb_dbg(musb, "Sending %d byte%s to ep0 fifo %p",
1054 					fifo_count,
1055 					(fifo_count == 1) ? "" : "s",
1056 					fifo_dest);
1057 			musb_write_fifo(hw_ep, fifo_count, fifo_dest);
1058 
1059 			urb->actual_length += fifo_count;
1060 			more = true;
1061 		}
1062 		break;
1063 	default:
1064 		ERR("bogus ep0 stage %d\n", musb->ep0_stage);
1065 		break;
1066 	}
1067 
1068 	return more;
1069 }
1070 
1071 /*
1072  * Handle default endpoint interrupt as host. Only called in IRQ time
1073  * from musb_interrupt().
1074  *
1075  * called with controller irqlocked
1076  */
1077 irqreturn_t musb_h_ep0_irq(struct musb *musb)
1078 {
1079 	struct urb		*urb;
1080 	u16			csr, len;
1081 	int			status = 0;
1082 	void __iomem		*mbase = musb->mregs;
1083 	struct musb_hw_ep	*hw_ep = musb->control_ep;
1084 	void __iomem		*epio = hw_ep->regs;
1085 	struct musb_qh		*qh = hw_ep->in_qh;
1086 	bool			complete = false;
1087 	irqreturn_t		retval = IRQ_NONE;
1088 
1089 	/* ep0 only has one queue, "in" */
1090 	urb = next_urb(qh);
1091 
1092 	musb_ep_select(mbase, 0);
1093 	csr = musb_readw(epio, MUSB_CSR0);
1094 	len = (csr & MUSB_CSR0_RXPKTRDY)
1095 			? musb_readb(epio, MUSB_COUNT0)
1096 			: 0;
1097 
1098 	musb_dbg(musb, "<== csr0 %04x, qh %p, count %d, urb %p, stage %d",
1099 		csr, qh, len, urb, musb->ep0_stage);
1100 
1101 	/* if we just did status stage, we are done */
1102 	if (MUSB_EP0_STATUS == musb->ep0_stage) {
1103 		retval = IRQ_HANDLED;
1104 		complete = true;
1105 	}
1106 
1107 	/* prepare status */
1108 	if (csr & MUSB_CSR0_H_RXSTALL) {
1109 		musb_dbg(musb, "STALLING ENDPOINT");
1110 		status = -EPIPE;
1111 
1112 	} else if (csr & MUSB_CSR0_H_ERROR) {
1113 		musb_dbg(musb, "no response, csr0 %04x", csr);
1114 		status = -EPROTO;
1115 
1116 	} else if (csr & MUSB_CSR0_H_NAKTIMEOUT) {
1117 		musb_dbg(musb, "control NAK timeout");
1118 
1119 		/* NOTE:  this code path would be a good place to PAUSE a
1120 		 * control transfer, if another one is queued, so that
1121 		 * ep0 is more likely to stay busy.  That's already done
1122 		 * for bulk RX transfers.
1123 		 *
1124 		 * if (qh->ring.next != &musb->control), then
1125 		 * we have a candidate... NAKing is *NOT* an error
1126 		 */
1127 		musb_writew(epio, MUSB_CSR0, 0);
1128 		retval = IRQ_HANDLED;
1129 	}
1130 
1131 	if (status) {
1132 		musb_dbg(musb, "aborting");
1133 		retval = IRQ_HANDLED;
1134 		if (urb)
1135 			urb->status = status;
1136 		complete = true;
1137 
1138 		/* use the proper sequence to abort the transfer */
1139 		if (csr & MUSB_CSR0_H_REQPKT) {
1140 			csr &= ~MUSB_CSR0_H_REQPKT;
1141 			musb_writew(epio, MUSB_CSR0, csr);
1142 			csr &= ~MUSB_CSR0_H_NAKTIMEOUT;
1143 			musb_writew(epio, MUSB_CSR0, csr);
1144 		} else {
1145 			musb_h_ep0_flush_fifo(hw_ep);
1146 		}
1147 
1148 		musb_writeb(epio, MUSB_NAKLIMIT0, 0);
1149 
1150 		/* clear it */
1151 		musb_writew(epio, MUSB_CSR0, 0);
1152 	}
1153 
1154 	if (unlikely(!urb)) {
1155 		/* stop endpoint since we have no place for its data, this
1156 		 * SHOULD NEVER HAPPEN! */
1157 		ERR("no URB for end 0\n");
1158 
1159 		musb_h_ep0_flush_fifo(hw_ep);
1160 		goto done;
1161 	}
1162 
1163 	if (!complete) {
1164 		/* call common logic and prepare response */
1165 		if (musb_h_ep0_continue(musb, len, urb)) {
1166 			/* more packets required */
1167 			csr = (MUSB_EP0_IN == musb->ep0_stage)
1168 				?  MUSB_CSR0_H_REQPKT : MUSB_CSR0_TXPKTRDY;
1169 		} else {
1170 			/* data transfer complete; perform status phase */
1171 			if (usb_pipeout(urb->pipe)
1172 					|| !urb->transfer_buffer_length)
1173 				csr = MUSB_CSR0_H_STATUSPKT
1174 					| MUSB_CSR0_H_REQPKT;
1175 			else
1176 				csr = MUSB_CSR0_H_STATUSPKT
1177 					| MUSB_CSR0_TXPKTRDY;
1178 
1179 			/* disable ping token in status phase */
1180 			csr |= MUSB_CSR0_H_DIS_PING;
1181 
1182 			/* flag status stage */
1183 			musb->ep0_stage = MUSB_EP0_STATUS;
1184 
1185 			musb_dbg(musb, "ep0 STATUS, csr %04x", csr);
1186 
1187 		}
1188 		musb_writew(epio, MUSB_CSR0, csr);
1189 		retval = IRQ_HANDLED;
1190 	} else
1191 		musb->ep0_stage = MUSB_EP0_IDLE;
1192 
1193 	/* call completion handler if done */
1194 	if (complete)
1195 		musb_advance_schedule(musb, urb, hw_ep, 1);
1196 done:
1197 	return retval;
1198 }
1199 
1200 
1201 #ifdef CONFIG_USB_INVENTRA_DMA
1202 
1203 /* Host side TX (OUT) using Mentor DMA works as follows:
1204 	submit_urb ->
1205 		- if queue was empty, Program Endpoint
1206 		- ... which starts DMA to fifo in mode 1 or 0
1207 
1208 	DMA Isr (transfer complete) -> TxAvail()
1209 		- Stop DMA (~DmaEnab)	(<--- Alert ... currently happens
1210 					only in musb_cleanup_urb)
1211 		- TxPktRdy has to be set in mode 0 or for
1212 			short packets in mode 1.
1213 */
1214 
1215 #endif
1216 
1217 /* Service a Tx-Available or dma completion irq for the endpoint */
1218 void musb_host_tx(struct musb *musb, u8 epnum)
1219 {
1220 	int			pipe;
1221 	bool			done = false;
1222 	u16			tx_csr;
1223 	size_t			length = 0;
1224 	size_t			offset = 0;
1225 	struct musb_hw_ep	*hw_ep = musb->endpoints + epnum;
1226 	void __iomem		*epio = hw_ep->regs;
1227 	struct musb_qh		*qh = hw_ep->out_qh;
1228 	struct urb		*urb = next_urb(qh);
1229 	u32			status = 0;
1230 	void __iomem		*mbase = musb->mregs;
1231 	struct dma_channel	*dma;
1232 	bool			transfer_pending = false;
1233 
1234 	musb_ep_select(mbase, epnum);
1235 	tx_csr = musb_readw(epio, MUSB_TXCSR);
1236 
1237 	/* with CPPI, DMA sometimes triggers "extra" irqs */
1238 	if (!urb) {
1239 		musb_dbg(musb, "extra TX%d ready, csr %04x", epnum, tx_csr);
1240 		return;
1241 	}
1242 
1243 	pipe = urb->pipe;
1244 	dma = is_dma_capable() ? hw_ep->tx_channel : NULL;
1245 	trace_musb_urb_tx(musb, urb);
1246 	musb_dbg(musb, "OUT/TX%d end, csr %04x%s", epnum, tx_csr,
1247 			dma ? ", dma" : "");
1248 
1249 	/* check for errors */
1250 	if (tx_csr & MUSB_TXCSR_H_RXSTALL) {
1251 		/* dma was disabled, fifo flushed */
1252 		musb_dbg(musb, "TX end %d stall", epnum);
1253 
1254 		/* stall; record URB status */
1255 		status = -EPIPE;
1256 
1257 	} else if (tx_csr & MUSB_TXCSR_H_ERROR) {
1258 		/* (NON-ISO) dma was disabled, fifo flushed */
1259 		musb_dbg(musb, "TX 3strikes on ep=%d", epnum);
1260 
1261 		status = -ETIMEDOUT;
1262 
1263 	} else if (tx_csr & MUSB_TXCSR_H_NAKTIMEOUT) {
1264 		if (USB_ENDPOINT_XFER_BULK == qh->type && qh->mux == 1
1265 				&& !list_is_singular(&musb->out_bulk)) {
1266 			musb_dbg(musb, "NAK timeout on TX%d ep", epnum);
1267 			musb_bulk_nak_timeout(musb, hw_ep, 0);
1268 		} else {
1269 			musb_dbg(musb, "TX ep%d device not responding", epnum);
1270 			/* NOTE:  this code path would be a good place to PAUSE a
1271 			 * transfer, if there's some other (nonperiodic) tx urb
1272 			 * that could use this fifo.  (dma complicates it...)
1273 			 * That's already done for bulk RX transfers.
1274 			 *
1275 			 * if (bulk && qh->ring.next != &musb->out_bulk), then
1276 			 * we have a candidate... NAKing is *NOT* an error
1277 			 */
1278 			musb_ep_select(mbase, epnum);
1279 			musb_writew(epio, MUSB_TXCSR,
1280 					MUSB_TXCSR_H_WZC_BITS
1281 					| MUSB_TXCSR_TXPKTRDY);
1282 		}
1283 			return;
1284 	}
1285 
1286 done:
1287 	if (status) {
1288 		if (dma_channel_status(dma) == MUSB_DMA_STATUS_BUSY) {
1289 			dma->status = MUSB_DMA_STATUS_CORE_ABORT;
1290 			musb->dma_controller->channel_abort(dma);
1291 		}
1292 
1293 		/* do the proper sequence to abort the transfer in the
1294 		 * usb core; the dma engine should already be stopped.
1295 		 */
1296 		musb_h_tx_flush_fifo(hw_ep);
1297 		tx_csr &= ~(MUSB_TXCSR_AUTOSET
1298 				| MUSB_TXCSR_DMAENAB
1299 				| MUSB_TXCSR_H_ERROR
1300 				| MUSB_TXCSR_H_RXSTALL
1301 				| MUSB_TXCSR_H_NAKTIMEOUT
1302 				);
1303 
1304 		musb_ep_select(mbase, epnum);
1305 		musb_writew(epio, MUSB_TXCSR, tx_csr);
1306 		/* REVISIT may need to clear FLUSHFIFO ... */
1307 		musb_writew(epio, MUSB_TXCSR, tx_csr);
1308 		musb_writeb(epio, MUSB_TXINTERVAL, 0);
1309 
1310 		done = true;
1311 	}
1312 
1313 	/* second cppi case */
1314 	if (dma_channel_status(dma) == MUSB_DMA_STATUS_BUSY) {
1315 		musb_dbg(musb, "extra TX%d ready, csr %04x", epnum, tx_csr);
1316 		return;
1317 	}
1318 
1319 	if (is_dma_capable() && dma && !status) {
1320 		/*
1321 		 * DMA has completed.  But if we're using DMA mode 1 (multi
1322 		 * packet DMA), we need a terminal TXPKTRDY interrupt before
1323 		 * we can consider this transfer completed, lest we trash
1324 		 * its last packet when writing the next URB's data.  So we
1325 		 * switch back to mode 0 to get that interrupt; we'll come
1326 		 * back here once it happens.
1327 		 */
1328 		if (tx_csr & MUSB_TXCSR_DMAMODE) {
1329 			/*
1330 			 * We shouldn't clear DMAMODE with DMAENAB set; so
1331 			 * clear them in a safe order.  That should be OK
1332 			 * once TXPKTRDY has been set (and I've never seen
1333 			 * it being 0 at this moment -- DMA interrupt latency
1334 			 * is significant) but if it hasn't been then we have
1335 			 * no choice but to stop being polite and ignore the
1336 			 * programmer's guide... :-)
1337 			 *
1338 			 * Note that we must write TXCSR with TXPKTRDY cleared
1339 			 * in order not to re-trigger the packet send (this bit
1340 			 * can't be cleared by CPU), and there's another caveat:
1341 			 * TXPKTRDY may be set shortly and then cleared in the
1342 			 * double-buffered FIFO mode, so we do an extra TXCSR
1343 			 * read for debouncing...
1344 			 */
1345 			tx_csr &= musb_readw(epio, MUSB_TXCSR);
1346 			if (tx_csr & MUSB_TXCSR_TXPKTRDY) {
1347 				tx_csr &= ~(MUSB_TXCSR_DMAENAB |
1348 					    MUSB_TXCSR_TXPKTRDY);
1349 				musb_writew(epio, MUSB_TXCSR,
1350 					    tx_csr | MUSB_TXCSR_H_WZC_BITS);
1351 			}
1352 			tx_csr &= ~(MUSB_TXCSR_DMAMODE |
1353 				    MUSB_TXCSR_TXPKTRDY);
1354 			musb_writew(epio, MUSB_TXCSR,
1355 				    tx_csr | MUSB_TXCSR_H_WZC_BITS);
1356 
1357 			/*
1358 			 * There is no guarantee that we'll get an interrupt
1359 			 * after clearing DMAMODE as we might have done this
1360 			 * too late (after TXPKTRDY was cleared by controller).
1361 			 * Re-read TXCSR as we have spoiled its previous value.
1362 			 */
1363 			tx_csr = musb_readw(epio, MUSB_TXCSR);
1364 		}
1365 
1366 		/*
1367 		 * We may get here from a DMA completion or TXPKTRDY interrupt.
1368 		 * In any case, we must check the FIFO status here and bail out
1369 		 * only if the FIFO still has data -- that should prevent the
1370 		 * "missed" TXPKTRDY interrupts and deal with double-buffered
1371 		 * FIFO mode too...
1372 		 */
1373 		if (tx_csr & (MUSB_TXCSR_FIFONOTEMPTY | MUSB_TXCSR_TXPKTRDY)) {
1374 			musb_dbg(musb,
1375 				"DMA complete but FIFO not empty, CSR %04x",
1376 				tx_csr);
1377 			return;
1378 		}
1379 	}
1380 
1381 	if (!status || dma || usb_pipeisoc(pipe)) {
1382 		if (dma)
1383 			length = dma->actual_len;
1384 		else
1385 			length = qh->segsize;
1386 		qh->offset += length;
1387 
1388 		if (usb_pipeisoc(pipe)) {
1389 			struct usb_iso_packet_descriptor	*d;
1390 
1391 			d = urb->iso_frame_desc + qh->iso_idx;
1392 			d->actual_length = length;
1393 			d->status = status;
1394 			if (++qh->iso_idx >= urb->number_of_packets) {
1395 				done = true;
1396 			} else {
1397 				d++;
1398 				offset = d->offset;
1399 				length = d->length;
1400 			}
1401 		} else if (dma && urb->transfer_buffer_length == qh->offset) {
1402 			done = true;
1403 		} else {
1404 			/* see if we need to send more data, or ZLP */
1405 			if (qh->segsize < qh->maxpacket)
1406 				done = true;
1407 			else if (qh->offset == urb->transfer_buffer_length
1408 					&& !(urb->transfer_flags
1409 						& URB_ZERO_PACKET))
1410 				done = true;
1411 			if (!done) {
1412 				offset = qh->offset;
1413 				length = urb->transfer_buffer_length - offset;
1414 				transfer_pending = true;
1415 			}
1416 		}
1417 	}
1418 
1419 	/* urb->status != -EINPROGRESS means request has been faulted,
1420 	 * so we must abort this transfer after cleanup
1421 	 */
1422 	if (urb->status != -EINPROGRESS) {
1423 		done = true;
1424 		if (status == 0)
1425 			status = urb->status;
1426 	}
1427 
1428 	if (done) {
1429 		/* set status */
1430 		urb->status = status;
1431 		urb->actual_length = qh->offset;
1432 		musb_advance_schedule(musb, urb, hw_ep, USB_DIR_OUT);
1433 		return;
1434 	} else if ((usb_pipeisoc(pipe) || transfer_pending) && dma) {
1435 		if (musb_tx_dma_program(musb->dma_controller, hw_ep, qh, urb,
1436 				offset, length)) {
1437 			if (is_cppi_enabled(musb) || tusb_dma_omap(musb))
1438 				musb_h_tx_dma_start(hw_ep);
1439 			return;
1440 		}
1441 	} else	if (tx_csr & MUSB_TXCSR_DMAENAB) {
1442 		musb_dbg(musb, "not complete, but DMA enabled?");
1443 		return;
1444 	}
1445 
1446 	/*
1447 	 * PIO: start next packet in this URB.
1448 	 *
1449 	 * REVISIT: some docs say that when hw_ep->tx_double_buffered,
1450 	 * (and presumably, FIFO is not half-full) we should write *two*
1451 	 * packets before updating TXCSR; other docs disagree...
1452 	 */
1453 	if (length > qh->maxpacket)
1454 		length = qh->maxpacket;
1455 	/* Unmap the buffer so that CPU can use it */
1456 	usb_hcd_unmap_urb_for_dma(musb->hcd, urb);
1457 
1458 	/*
1459 	 * We need to map sg if the transfer_buffer is
1460 	 * NULL.
1461 	 */
1462 	if (!urb->transfer_buffer)
1463 		qh->use_sg = true;
1464 
1465 	if (qh->use_sg) {
1466 		/* sg_miter_start is already done in musb_ep_program */
1467 		if (!sg_miter_next(&qh->sg_miter)) {
1468 			dev_err(musb->controller, "error: sg list empty\n");
1469 			sg_miter_stop(&qh->sg_miter);
1470 			status = -EINVAL;
1471 			goto done;
1472 		}
1473 		urb->transfer_buffer = qh->sg_miter.addr;
1474 		length = min_t(u32, length, qh->sg_miter.length);
1475 		musb_write_fifo(hw_ep, length, urb->transfer_buffer);
1476 		qh->sg_miter.consumed = length;
1477 		sg_miter_stop(&qh->sg_miter);
1478 	} else {
1479 		musb_write_fifo(hw_ep, length, urb->transfer_buffer + offset);
1480 	}
1481 
1482 	qh->segsize = length;
1483 
1484 	if (qh->use_sg) {
1485 		if (offset + length >= urb->transfer_buffer_length)
1486 			qh->use_sg = false;
1487 	}
1488 
1489 	musb_ep_select(mbase, epnum);
1490 	musb_writew(epio, MUSB_TXCSR,
1491 			MUSB_TXCSR_H_WZC_BITS | MUSB_TXCSR_TXPKTRDY);
1492 }
1493 
1494 #ifdef CONFIG_USB_TI_CPPI41_DMA
1495 /* Seems to set up ISO for cppi41 and not advance len. See commit c57c41d */
1496 static int musb_rx_dma_iso_cppi41(struct dma_controller *dma,
1497 				  struct musb_hw_ep *hw_ep,
1498 				  struct musb_qh *qh,
1499 				  struct urb *urb,
1500 				  size_t len)
1501 {
1502 	struct dma_channel *channel = hw_ep->rx_channel;
1503 	void __iomem *epio = hw_ep->regs;
1504 	dma_addr_t *buf;
1505 	u32 length;
1506 	u16 val;
1507 
1508 	buf = (void *)urb->iso_frame_desc[qh->iso_idx].offset +
1509 		(u32)urb->transfer_dma;
1510 
1511 	length = urb->iso_frame_desc[qh->iso_idx].length;
1512 
1513 	val = musb_readw(epio, MUSB_RXCSR);
1514 	val |= MUSB_RXCSR_DMAENAB;
1515 	musb_writew(hw_ep->regs, MUSB_RXCSR, val);
1516 
1517 	return dma->channel_program(channel, qh->maxpacket, 0,
1518 				   (u32)buf, length);
1519 }
1520 #else
1521 static inline int musb_rx_dma_iso_cppi41(struct dma_controller *dma,
1522 					 struct musb_hw_ep *hw_ep,
1523 					 struct musb_qh *qh,
1524 					 struct urb *urb,
1525 					 size_t len)
1526 {
1527 	return false;
1528 }
1529 #endif
1530 
1531 #if defined(CONFIG_USB_INVENTRA_DMA) || defined(CONFIG_USB_UX500_DMA) || \
1532 	defined(CONFIG_USB_TI_CPPI41_DMA)
1533 /* Host side RX (IN) using Mentor DMA works as follows:
1534 	submit_urb ->
1535 		- if queue was empty, ProgramEndpoint
1536 		- first IN token is sent out (by setting ReqPkt)
1537 	LinuxIsr -> RxReady()
1538 	/\	=> first packet is received
1539 	|	- Set in mode 0 (DmaEnab, ~ReqPkt)
1540 	|		-> DMA Isr (transfer complete) -> RxReady()
1541 	|		    - Ack receive (~RxPktRdy), turn off DMA (~DmaEnab)
1542 	|		    - if urb not complete, send next IN token (ReqPkt)
1543 	|			   |		else complete urb.
1544 	|			   |
1545 	---------------------------
1546  *
1547  * Nuances of mode 1:
1548  *	For short packets, no ack (+RxPktRdy) is sent automatically
1549  *	(even if AutoClear is ON)
1550  *	For full packets, ack (~RxPktRdy) and next IN token (+ReqPkt) is sent
1551  *	automatically => major problem, as collecting the next packet becomes
1552  *	difficult. Hence mode 1 is not used.
1553  *
1554  * REVISIT
1555  *	All we care about at this driver level is that
1556  *       (a) all URBs terminate with REQPKT cleared and fifo(s) empty;
1557  *       (b) termination conditions are: short RX, or buffer full;
1558  *       (c) fault modes include
1559  *           - iff URB_SHORT_NOT_OK, short RX status is -EREMOTEIO.
1560  *             (and that endpoint's dma queue stops immediately)
1561  *           - overflow (full, PLUS more bytes in the terminal packet)
1562  *
1563  *	So for example, usb-storage sets URB_SHORT_NOT_OK, and would
1564  *	thus be a great candidate for using mode 1 ... for all but the
1565  *	last packet of one URB's transfer.
1566  */
1567 static int musb_rx_dma_inventra_cppi41(struct dma_controller *dma,
1568 				       struct musb_hw_ep *hw_ep,
1569 				       struct musb_qh *qh,
1570 				       struct urb *urb,
1571 				       size_t len)
1572 {
1573 	struct dma_channel *channel = hw_ep->rx_channel;
1574 	void __iomem *epio = hw_ep->regs;
1575 	u16 val;
1576 	int pipe;
1577 	bool done;
1578 
1579 	pipe = urb->pipe;
1580 
1581 	if (usb_pipeisoc(pipe)) {
1582 		struct usb_iso_packet_descriptor *d;
1583 
1584 		d = urb->iso_frame_desc + qh->iso_idx;
1585 		d->actual_length = len;
1586 
1587 		/* even if there was an error, we did the dma
1588 		 * for iso_frame_desc->length
1589 		 */
1590 		if (d->status != -EILSEQ && d->status != -EOVERFLOW)
1591 			d->status = 0;
1592 
1593 		if (++qh->iso_idx >= urb->number_of_packets) {
1594 			done = true;
1595 		} else {
1596 			/* REVISIT: Why ignore return value here? */
1597 			if (musb_dma_cppi41(hw_ep->musb))
1598 				done = musb_rx_dma_iso_cppi41(dma, hw_ep, qh,
1599 							      urb, len);
1600 			done = false;
1601 		}
1602 
1603 	} else  {
1604 		/* done if urb buffer is full or short packet is recd */
1605 		done = (urb->actual_length + len >=
1606 			urb->transfer_buffer_length
1607 			|| channel->actual_len < qh->maxpacket
1608 			|| channel->rx_packet_done);
1609 	}
1610 
1611 	/* send IN token for next packet, without AUTOREQ */
1612 	if (!done) {
1613 		val = musb_readw(epio, MUSB_RXCSR);
1614 		val |= MUSB_RXCSR_H_REQPKT;
1615 		musb_writew(epio, MUSB_RXCSR, MUSB_RXCSR_H_WZC_BITS | val);
1616 	}
1617 
1618 	return done;
1619 }
1620 
1621 /* Disadvantage of using mode 1:
1622  *	It's basically usable only for mass storage class; essentially all
1623  *	other protocols also terminate transfers on short packets.
1624  *
1625  * Details:
1626  *	An extra IN token is sent at the end of the transfer (due to AUTOREQ)
1627  *	If you try to use mode 1 for (transfer_buffer_length - 512), and try
1628  *	to use the extra IN token to grab the last packet using mode 0, then
1629  *	the problem is that you cannot be sure when the device will send the
1630  *	last packet and RxPktRdy set. Sometimes the packet is recd too soon
1631  *	such that it gets lost when RxCSR is re-set at the end of the mode 1
1632  *	transfer, while sometimes it is recd just a little late so that if you
1633  *	try to configure for mode 0 soon after the mode 1 transfer is
1634  *	completed, you will find rxcount 0. Okay, so you might think why not
1635  *	wait for an interrupt when the pkt is recd. Well, you won't get any!
1636  */
1637 static int musb_rx_dma_in_inventra_cppi41(struct dma_controller *dma,
1638 					  struct musb_hw_ep *hw_ep,
1639 					  struct musb_qh *qh,
1640 					  struct urb *urb,
1641 					  size_t len,
1642 					  u8 iso_err)
1643 {
1644 	struct musb *musb = hw_ep->musb;
1645 	void __iomem *epio = hw_ep->regs;
1646 	struct dma_channel *channel = hw_ep->rx_channel;
1647 	u16 rx_count, val;
1648 	int length, pipe, done;
1649 	dma_addr_t buf;
1650 
1651 	rx_count = musb_readw(epio, MUSB_RXCOUNT);
1652 	pipe = urb->pipe;
1653 
1654 	if (usb_pipeisoc(pipe)) {
1655 		int d_status = 0;
1656 		struct usb_iso_packet_descriptor *d;
1657 
1658 		d = urb->iso_frame_desc + qh->iso_idx;
1659 
1660 		if (iso_err) {
1661 			d_status = -EILSEQ;
1662 			urb->error_count++;
1663 		}
1664 		if (rx_count > d->length) {
1665 			if (d_status == 0) {
1666 				d_status = -EOVERFLOW;
1667 				urb->error_count++;
1668 			}
1669 			musb_dbg(musb, "** OVERFLOW %d into %d",
1670 				rx_count, d->length);
1671 
1672 			length = d->length;
1673 		} else
1674 			length = rx_count;
1675 		d->status = d_status;
1676 		buf = urb->transfer_dma + d->offset;
1677 	} else {
1678 		length = rx_count;
1679 		buf = urb->transfer_dma + urb->actual_length;
1680 	}
1681 
1682 	channel->desired_mode = 0;
1683 #ifdef USE_MODE1
1684 	/* because of the issue below, mode 1 will
1685 	 * only rarely behave with correct semantics.
1686 	 */
1687 	if ((urb->transfer_flags & URB_SHORT_NOT_OK)
1688 	    && (urb->transfer_buffer_length - urb->actual_length)
1689 	    > qh->maxpacket)
1690 		channel->desired_mode = 1;
1691 	if (rx_count < hw_ep->max_packet_sz_rx) {
1692 		length = rx_count;
1693 		channel->desired_mode = 0;
1694 	} else {
1695 		length = urb->transfer_buffer_length;
1696 	}
1697 #endif
1698 
1699 	/* See comments above on disadvantages of using mode 1 */
1700 	val = musb_readw(epio, MUSB_RXCSR);
1701 	val &= ~MUSB_RXCSR_H_REQPKT;
1702 
1703 	if (channel->desired_mode == 0)
1704 		val &= ~MUSB_RXCSR_H_AUTOREQ;
1705 	else
1706 		val |= MUSB_RXCSR_H_AUTOREQ;
1707 	val |= MUSB_RXCSR_DMAENAB;
1708 
1709 	/* autoclear shouldn't be set in high bandwidth */
1710 	if (qh->hb_mult == 1)
1711 		val |= MUSB_RXCSR_AUTOCLEAR;
1712 
1713 	musb_writew(epio, MUSB_RXCSR, MUSB_RXCSR_H_WZC_BITS | val);
1714 
1715 	/* REVISIT if when actual_length != 0,
1716 	 * transfer_buffer_length needs to be
1717 	 * adjusted first...
1718 	 */
1719 	done = dma->channel_program(channel, qh->maxpacket,
1720 				   channel->desired_mode,
1721 				   buf, length);
1722 
1723 	if (!done) {
1724 		dma->channel_release(channel);
1725 		hw_ep->rx_channel = NULL;
1726 		channel = NULL;
1727 		val = musb_readw(epio, MUSB_RXCSR);
1728 		val &= ~(MUSB_RXCSR_DMAENAB
1729 			 | MUSB_RXCSR_H_AUTOREQ
1730 			 | MUSB_RXCSR_AUTOCLEAR);
1731 		musb_writew(epio, MUSB_RXCSR, val);
1732 	}
1733 
1734 	return done;
1735 }
1736 #else
1737 static inline int musb_rx_dma_inventra_cppi41(struct dma_controller *dma,
1738 					      struct musb_hw_ep *hw_ep,
1739 					      struct musb_qh *qh,
1740 					      struct urb *urb,
1741 					      size_t len)
1742 {
1743 	return false;
1744 }
1745 
1746 static inline int musb_rx_dma_in_inventra_cppi41(struct dma_controller *dma,
1747 						 struct musb_hw_ep *hw_ep,
1748 						 struct musb_qh *qh,
1749 						 struct urb *urb,
1750 						 size_t len,
1751 						 u8 iso_err)
1752 {
1753 	return false;
1754 }
1755 #endif
1756 
1757 /*
1758  * Service an RX interrupt for the given IN endpoint; docs cover bulk, iso,
1759  * and high-bandwidth IN transfer cases.
1760  */
1761 void musb_host_rx(struct musb *musb, u8 epnum)
1762 {
1763 	struct urb		*urb;
1764 	struct musb_hw_ep	*hw_ep = musb->endpoints + epnum;
1765 	struct dma_controller	*c = musb->dma_controller;
1766 	void __iomem		*epio = hw_ep->regs;
1767 	struct musb_qh		*qh = hw_ep->in_qh;
1768 	size_t			xfer_len;
1769 	void __iomem		*mbase = musb->mregs;
1770 	u16			rx_csr, val;
1771 	bool			iso_err = false;
1772 	bool			done = false;
1773 	u32			status;
1774 	struct dma_channel	*dma;
1775 	unsigned int sg_flags = SG_MITER_ATOMIC | SG_MITER_TO_SG;
1776 
1777 	musb_ep_select(mbase, epnum);
1778 
1779 	urb = next_urb(qh);
1780 	dma = is_dma_capable() ? hw_ep->rx_channel : NULL;
1781 	status = 0;
1782 	xfer_len = 0;
1783 
1784 	rx_csr = musb_readw(epio, MUSB_RXCSR);
1785 	val = rx_csr;
1786 
1787 	if (unlikely(!urb)) {
1788 		/* REVISIT -- THIS SHOULD NEVER HAPPEN ... but, at least
1789 		 * usbtest #11 (unlinks) triggers it regularly, sometimes
1790 		 * with fifo full.  (Only with DMA??)
1791 		 */
1792 		musb_dbg(musb, "BOGUS RX%d ready, csr %04x, count %d",
1793 			epnum, val, musb_readw(epio, MUSB_RXCOUNT));
1794 		musb_h_flush_rxfifo(hw_ep, MUSB_RXCSR_CLRDATATOG);
1795 		return;
1796 	}
1797 
1798 	trace_musb_urb_rx(musb, urb);
1799 
1800 	/* check for errors, concurrent stall & unlink is not really
1801 	 * handled yet! */
1802 	if (rx_csr & MUSB_RXCSR_H_RXSTALL) {
1803 		musb_dbg(musb, "RX end %d STALL", epnum);
1804 
1805 		/* stall; record URB status */
1806 		status = -EPIPE;
1807 
1808 	} else if (rx_csr & MUSB_RXCSR_H_ERROR) {
1809 		musb_dbg(musb, "end %d RX proto error", epnum);
1810 
1811 		status = -EPROTO;
1812 		musb_writeb(epio, MUSB_RXINTERVAL, 0);
1813 
1814 		rx_csr &= ~MUSB_RXCSR_H_ERROR;
1815 		musb_writew(epio, MUSB_RXCSR, rx_csr);
1816 
1817 	} else if (rx_csr & MUSB_RXCSR_DATAERROR) {
1818 
1819 		if (USB_ENDPOINT_XFER_ISOC != qh->type) {
1820 			musb_dbg(musb, "RX end %d NAK timeout", epnum);
1821 
1822 			/* NOTE: NAKing is *NOT* an error, so we want to
1823 			 * continue.  Except ... if there's a request for
1824 			 * another QH, use that instead of starving it.
1825 			 *
1826 			 * Devices like Ethernet and serial adapters keep
1827 			 * reads posted at all times, which will starve
1828 			 * other devices without this logic.
1829 			 */
1830 			if (usb_pipebulk(urb->pipe)
1831 					&& qh->mux == 1
1832 					&& !list_is_singular(&musb->in_bulk)) {
1833 				musb_bulk_nak_timeout(musb, hw_ep, 1);
1834 				return;
1835 			}
1836 			musb_ep_select(mbase, epnum);
1837 			rx_csr |= MUSB_RXCSR_H_WZC_BITS;
1838 			rx_csr &= ~MUSB_RXCSR_DATAERROR;
1839 			musb_writew(epio, MUSB_RXCSR, rx_csr);
1840 
1841 			goto finish;
1842 		} else {
1843 			musb_dbg(musb, "RX end %d ISO data error", epnum);
1844 			/* packet error reported later */
1845 			iso_err = true;
1846 		}
1847 	} else if (rx_csr & MUSB_RXCSR_INCOMPRX) {
1848 		musb_dbg(musb, "end %d high bandwidth incomplete ISO packet RX",
1849 				epnum);
1850 		status = -EPROTO;
1851 	}
1852 
1853 	/* faults abort the transfer */
1854 	if (status) {
1855 		/* clean up dma and collect transfer count */
1856 		if (dma_channel_status(dma) == MUSB_DMA_STATUS_BUSY) {
1857 			dma->status = MUSB_DMA_STATUS_CORE_ABORT;
1858 			musb->dma_controller->channel_abort(dma);
1859 			xfer_len = dma->actual_len;
1860 		}
1861 		musb_h_flush_rxfifo(hw_ep, MUSB_RXCSR_CLRDATATOG);
1862 		musb_writeb(epio, MUSB_RXINTERVAL, 0);
1863 		done = true;
1864 		goto finish;
1865 	}
1866 
1867 	if (unlikely(dma_channel_status(dma) == MUSB_DMA_STATUS_BUSY)) {
1868 		/* SHOULD NEVER HAPPEN ... but at least DaVinci has done it */
1869 		ERR("RX%d dma busy, csr %04x\n", epnum, rx_csr);
1870 		goto finish;
1871 	}
1872 
1873 	/* thorough shutdown for now ... given more precise fault handling
1874 	 * and better queueing support, we might keep a DMA pipeline going
1875 	 * while processing this irq for earlier completions.
1876 	 */
1877 
1878 	/* FIXME this is _way_ too much in-line logic for Mentor DMA */
1879 	if (!musb_dma_inventra(musb) && !musb_dma_ux500(musb) &&
1880 	    (rx_csr & MUSB_RXCSR_H_REQPKT)) {
1881 		/* REVISIT this happened for a while on some short reads...
1882 		 * the cleanup still needs investigation... looks bad...
1883 		 * and also duplicates dma cleanup code above ... plus,
1884 		 * shouldn't this be the "half full" double buffer case?
1885 		 */
1886 		if (dma_channel_status(dma) == MUSB_DMA_STATUS_BUSY) {
1887 			dma->status = MUSB_DMA_STATUS_CORE_ABORT;
1888 			musb->dma_controller->channel_abort(dma);
1889 			xfer_len = dma->actual_len;
1890 			done = true;
1891 		}
1892 
1893 		musb_dbg(musb, "RXCSR%d %04x, reqpkt, len %zu%s", epnum, rx_csr,
1894 				xfer_len, dma ? ", dma" : "");
1895 		rx_csr &= ~MUSB_RXCSR_H_REQPKT;
1896 
1897 		musb_ep_select(mbase, epnum);
1898 		musb_writew(epio, MUSB_RXCSR,
1899 				MUSB_RXCSR_H_WZC_BITS | rx_csr);
1900 	}
1901 
1902 	if (dma && (rx_csr & MUSB_RXCSR_DMAENAB)) {
1903 		xfer_len = dma->actual_len;
1904 
1905 		val &= ~(MUSB_RXCSR_DMAENAB
1906 			| MUSB_RXCSR_H_AUTOREQ
1907 			| MUSB_RXCSR_AUTOCLEAR
1908 			| MUSB_RXCSR_RXPKTRDY);
1909 		musb_writew(hw_ep->regs, MUSB_RXCSR, val);
1910 
1911 		if (musb_dma_inventra(musb) || musb_dma_ux500(musb) ||
1912 		    musb_dma_cppi41(musb)) {
1913 			    done = musb_rx_dma_inventra_cppi41(c, hw_ep, qh, urb, xfer_len);
1914 			    musb_dbg(hw_ep->musb,
1915 				    "ep %d dma %s, rxcsr %04x, rxcount %d",
1916 				    epnum, done ? "off" : "reset",
1917 				    musb_readw(epio, MUSB_RXCSR),
1918 				    musb_readw(epio, MUSB_RXCOUNT));
1919 		} else {
1920 			done = true;
1921 		}
1922 
1923 	} else if (urb->status == -EINPROGRESS) {
1924 		/* if no errors, be sure a packet is ready for unloading */
1925 		if (unlikely(!(rx_csr & MUSB_RXCSR_RXPKTRDY))) {
1926 			status = -EPROTO;
1927 			ERR("Rx interrupt with no errors or packet!\n");
1928 
1929 			/* FIXME this is another "SHOULD NEVER HAPPEN" */
1930 
1931 /* SCRUB (RX) */
1932 			/* do the proper sequence to abort the transfer */
1933 			musb_ep_select(mbase, epnum);
1934 			val &= ~MUSB_RXCSR_H_REQPKT;
1935 			musb_writew(epio, MUSB_RXCSR, val);
1936 			goto finish;
1937 		}
1938 
1939 		/* we are expecting IN packets */
1940 		if ((musb_dma_inventra(musb) || musb_dma_ux500(musb) ||
1941 		    musb_dma_cppi41(musb)) && dma) {
1942 			musb_dbg(hw_ep->musb,
1943 				"RX%d count %d, buffer 0x%llx len %d/%d",
1944 				epnum, musb_readw(epio, MUSB_RXCOUNT),
1945 				(unsigned long long) urb->transfer_dma
1946 				+ urb->actual_length,
1947 				qh->offset,
1948 				urb->transfer_buffer_length);
1949 
1950 			if (musb_rx_dma_in_inventra_cppi41(c, hw_ep, qh, urb,
1951 							   xfer_len, iso_err))
1952 				goto finish;
1953 			else
1954 				dev_err(musb->controller, "error: rx_dma failed\n");
1955 		}
1956 
1957 		if (!dma) {
1958 			unsigned int received_len;
1959 
1960 			/* Unmap the buffer so that CPU can use it */
1961 			usb_hcd_unmap_urb_for_dma(musb->hcd, urb);
1962 
1963 			/*
1964 			 * We need to map sg if the transfer_buffer is
1965 			 * NULL.
1966 			 */
1967 			if (!urb->transfer_buffer) {
1968 				qh->use_sg = true;
1969 				sg_miter_start(&qh->sg_miter, urb->sg, 1,
1970 						sg_flags);
1971 			}
1972 
1973 			if (qh->use_sg) {
1974 				if (!sg_miter_next(&qh->sg_miter)) {
1975 					dev_err(musb->controller, "error: sg list empty\n");
1976 					sg_miter_stop(&qh->sg_miter);
1977 					status = -EINVAL;
1978 					done = true;
1979 					goto finish;
1980 				}
1981 				urb->transfer_buffer = qh->sg_miter.addr;
1982 				received_len = urb->actual_length;
1983 				qh->offset = 0x0;
1984 				done = musb_host_packet_rx(musb, urb, epnum,
1985 						iso_err);
1986 				/* Calculate the number of bytes received */
1987 				received_len = urb->actual_length -
1988 					received_len;
1989 				qh->sg_miter.consumed = received_len;
1990 				sg_miter_stop(&qh->sg_miter);
1991 			} else {
1992 				done = musb_host_packet_rx(musb, urb,
1993 						epnum, iso_err);
1994 			}
1995 			musb_dbg(musb, "read %spacket", done ? "last " : "");
1996 		}
1997 	}
1998 
1999 finish:
2000 	urb->actual_length += xfer_len;
2001 	qh->offset += xfer_len;
2002 	if (done) {
2003 		if (qh->use_sg)
2004 			qh->use_sg = false;
2005 
2006 		if (urb->status == -EINPROGRESS)
2007 			urb->status = status;
2008 		musb_advance_schedule(musb, urb, hw_ep, USB_DIR_IN);
2009 	}
2010 }
2011 
2012 /* schedule nodes correspond to peripheral endpoints, like an OHCI QH.
2013  * the software schedule associates multiple such nodes with a given
2014  * host side hardware endpoint + direction; scheduling may activate
2015  * that hardware endpoint.
2016  */
2017 static int musb_schedule(
2018 	struct musb		*musb,
2019 	struct musb_qh		*qh,
2020 	int			is_in)
2021 {
2022 	int			idle = 0;
2023 	int			best_diff;
2024 	int			best_end, epnum;
2025 	struct musb_hw_ep	*hw_ep = NULL;
2026 	struct list_head	*head = NULL;
2027 	u8			toggle;
2028 	u8			txtype;
2029 	struct urb		*urb = next_urb(qh);
2030 
2031 	/* use fixed hardware for control and bulk */
2032 	if (qh->type == USB_ENDPOINT_XFER_CONTROL) {
2033 		head = &musb->control;
2034 		hw_ep = musb->control_ep;
2035 		goto success;
2036 	}
2037 
2038 	/* else, periodic transfers get muxed to other endpoints */
2039 
2040 	/*
2041 	 * We know this qh hasn't been scheduled, so all we need to do
2042 	 * is choose which hardware endpoint to put it on ...
2043 	 *
2044 	 * REVISIT what we really want here is a regular schedule tree
2045 	 * like e.g. OHCI uses.
2046 	 */
2047 	best_diff = 4096;
2048 	best_end = -1;
2049 
2050 	for (epnum = 1, hw_ep = musb->endpoints + 1;
2051 			epnum < musb->nr_endpoints;
2052 			epnum++, hw_ep++) {
2053 		int	diff;
2054 
2055 		if (musb_ep_get_qh(hw_ep, is_in) != NULL)
2056 			continue;
2057 
2058 		if (hw_ep == musb->bulk_ep)
2059 			continue;
2060 
2061 		if (is_in)
2062 			diff = hw_ep->max_packet_sz_rx;
2063 		else
2064 			diff = hw_ep->max_packet_sz_tx;
2065 		diff -= (qh->maxpacket * qh->hb_mult);
2066 
2067 		if (diff >= 0 && best_diff > diff) {
2068 
2069 			/*
2070 			 * Mentor controller has a bug in that if we schedule
2071 			 * a BULK Tx transfer on an endpoint that had earlier
2072 			 * handled ISOC then the BULK transfer has to start on
2073 			 * a zero toggle.  If the BULK transfer starts on a 1
2074 			 * toggle then this transfer will fail as the mentor
2075 			 * controller starts the Bulk transfer on a 0 toggle
2076 			 * irrespective of the programming of the toggle bits
2077 			 * in the TXCSR register.  Check for this condition
2078 			 * while allocating the EP for a Tx Bulk transfer.  If
2079 			 * so skip this EP.
2080 			 */
2081 			hw_ep = musb->endpoints + epnum;
2082 			toggle = usb_gettoggle(urb->dev, qh->epnum, !is_in);
2083 			txtype = (musb_readb(hw_ep->regs, MUSB_TXTYPE)
2084 					>> 4) & 0x3;
2085 			if (!is_in && (qh->type == USB_ENDPOINT_XFER_BULK) &&
2086 				toggle && (txtype == USB_ENDPOINT_XFER_ISOC))
2087 				continue;
2088 
2089 			best_diff = diff;
2090 			best_end = epnum;
2091 		}
2092 	}
2093 	/* use bulk reserved ep1 if no other ep is free */
2094 	if (best_end < 0 && qh->type == USB_ENDPOINT_XFER_BULK) {
2095 		hw_ep = musb->bulk_ep;
2096 		if (is_in)
2097 			head = &musb->in_bulk;
2098 		else
2099 			head = &musb->out_bulk;
2100 
2101 		/* Enable bulk RX/TX NAK timeout scheme when bulk requests are
2102 		 * multiplexed. This scheme does not work in high speed to full
2103 		 * speed scenario as NAK interrupts are not coming from a
2104 		 * full speed device connected to a high speed device.
2105 		 * NAK timeout interval is 8 (128 uframe or 16ms) for HS and
2106 		 * 4 (8 frame or 8ms) for FS device.
2107 		 */
2108 		if (qh->dev)
2109 			qh->intv_reg =
2110 				(USB_SPEED_HIGH == qh->dev->speed) ? 8 : 4;
2111 		goto success;
2112 	} else if (best_end < 0) {
2113 		dev_err(musb->controller,
2114 				"%s hwep alloc failed for %dx%d\n",
2115 				musb_ep_xfertype_string(qh->type),
2116 				qh->hb_mult, qh->maxpacket);
2117 		return -ENOSPC;
2118 	}
2119 
2120 	idle = 1;
2121 	qh->mux = 0;
2122 	hw_ep = musb->endpoints + best_end;
2123 	musb_dbg(musb, "qh %p periodic slot %d", qh, best_end);
2124 success:
2125 	if (head) {
2126 		idle = list_empty(head);
2127 		list_add_tail(&qh->ring, head);
2128 		qh->mux = 1;
2129 	}
2130 	qh->hw_ep = hw_ep;
2131 	qh->hep->hcpriv = qh;
2132 	if (idle)
2133 		musb_start_urb(musb, is_in, qh);
2134 	return 0;
2135 }
2136 
2137 static int musb_urb_enqueue(
2138 	struct usb_hcd			*hcd,
2139 	struct urb			*urb,
2140 	gfp_t				mem_flags)
2141 {
2142 	unsigned long			flags;
2143 	struct musb			*musb = hcd_to_musb(hcd);
2144 	struct usb_host_endpoint	*hep = urb->ep;
2145 	struct musb_qh			*qh;
2146 	struct usb_endpoint_descriptor	*epd = &hep->desc;
2147 	int				ret;
2148 	unsigned			type_reg;
2149 	unsigned			interval;
2150 
2151 	/* host role must be active */
2152 	if (!is_host_active(musb) || !musb->is_active)
2153 		return -ENODEV;
2154 
2155 	trace_musb_urb_enq(musb, urb);
2156 
2157 	spin_lock_irqsave(&musb->lock, flags);
2158 	ret = usb_hcd_link_urb_to_ep(hcd, urb);
2159 	qh = ret ? NULL : hep->hcpriv;
2160 	if (qh)
2161 		urb->hcpriv = qh;
2162 	spin_unlock_irqrestore(&musb->lock, flags);
2163 
2164 	/* DMA mapping was already done, if needed, and this urb is on
2165 	 * hep->urb_list now ... so we're done, unless hep wasn't yet
2166 	 * scheduled onto a live qh.
2167 	 *
2168 	 * REVISIT best to keep hep->hcpriv valid until the endpoint gets
2169 	 * disabled, testing for empty qh->ring and avoiding qh setup costs
2170 	 * except for the first urb queued after a config change.
2171 	 */
2172 	if (qh || ret)
2173 		return ret;
2174 
2175 	/* Allocate and initialize qh, minimizing the work done each time
2176 	 * hw_ep gets reprogrammed, or with irqs blocked.  Then schedule it.
2177 	 *
2178 	 * REVISIT consider a dedicated qh kmem_cache, so it's harder
2179 	 * for bugs in other kernel code to break this driver...
2180 	 */
2181 	qh = kzalloc(sizeof *qh, mem_flags);
2182 	if (!qh) {
2183 		spin_lock_irqsave(&musb->lock, flags);
2184 		usb_hcd_unlink_urb_from_ep(hcd, urb);
2185 		spin_unlock_irqrestore(&musb->lock, flags);
2186 		return -ENOMEM;
2187 	}
2188 
2189 	qh->hep = hep;
2190 	qh->dev = urb->dev;
2191 	INIT_LIST_HEAD(&qh->ring);
2192 	qh->is_ready = 1;
2193 
2194 	qh->maxpacket = usb_endpoint_maxp(epd);
2195 	qh->type = usb_endpoint_type(epd);
2196 
2197 	/* Bits 11 & 12 of wMaxPacketSize encode high bandwidth multiplier.
2198 	 * Some musb cores don't support high bandwidth ISO transfers; and
2199 	 * we don't (yet!) support high bandwidth interrupt transfers.
2200 	 */
2201 	qh->hb_mult = usb_endpoint_maxp_mult(epd);
2202 	if (qh->hb_mult > 1) {
2203 		int ok = (qh->type == USB_ENDPOINT_XFER_ISOC);
2204 
2205 		if (ok)
2206 			ok = (usb_pipein(urb->pipe) && musb->hb_iso_rx)
2207 				|| (usb_pipeout(urb->pipe) && musb->hb_iso_tx);
2208 		if (!ok) {
2209 			dev_err(musb->controller,
2210 				"high bandwidth %s (%dx%d) not supported\n",
2211 				musb_ep_xfertype_string(qh->type),
2212 				qh->hb_mult, qh->maxpacket & 0x7ff);
2213 			ret = -EMSGSIZE;
2214 			goto done;
2215 		}
2216 		qh->maxpacket &= 0x7ff;
2217 	}
2218 
2219 	qh->epnum = usb_endpoint_num(epd);
2220 
2221 	/* NOTE: urb->dev->devnum is wrong during SET_ADDRESS */
2222 	qh->addr_reg = (u8) usb_pipedevice(urb->pipe);
2223 
2224 	/* precompute rxtype/txtype/type0 register */
2225 	type_reg = (qh->type << 4) | qh->epnum;
2226 	switch (urb->dev->speed) {
2227 	case USB_SPEED_LOW:
2228 		type_reg |= 0xc0;
2229 		break;
2230 	case USB_SPEED_FULL:
2231 		type_reg |= 0x80;
2232 		break;
2233 	default:
2234 		type_reg |= 0x40;
2235 	}
2236 	qh->type_reg = type_reg;
2237 
2238 	/* Precompute RXINTERVAL/TXINTERVAL register */
2239 	switch (qh->type) {
2240 	case USB_ENDPOINT_XFER_INT:
2241 		/*
2242 		 * Full/low speeds use the  linear encoding,
2243 		 * high speed uses the logarithmic encoding.
2244 		 */
2245 		if (urb->dev->speed <= USB_SPEED_FULL) {
2246 			interval = max_t(u8, epd->bInterval, 1);
2247 			break;
2248 		}
2249 		/* FALLTHROUGH */
2250 	case USB_ENDPOINT_XFER_ISOC:
2251 		/* ISO always uses logarithmic encoding */
2252 		interval = min_t(u8, epd->bInterval, 16);
2253 		break;
2254 	default:
2255 		/* REVISIT we actually want to use NAK limits, hinting to the
2256 		 * transfer scheduling logic to try some other qh, e.g. try
2257 		 * for 2 msec first:
2258 		 *
2259 		 * interval = (USB_SPEED_HIGH == urb->dev->speed) ? 16 : 2;
2260 		 *
2261 		 * The downside of disabling this is that transfer scheduling
2262 		 * gets VERY unfair for nonperiodic transfers; a misbehaving
2263 		 * peripheral could make that hurt.  That's perfectly normal
2264 		 * for reads from network or serial adapters ... so we have
2265 		 * partial NAKlimit support for bulk RX.
2266 		 *
2267 		 * The upside of disabling it is simpler transfer scheduling.
2268 		 */
2269 		interval = 0;
2270 	}
2271 	qh->intv_reg = interval;
2272 
2273 	/* precompute addressing for external hub/tt ports */
2274 	if (musb->is_multipoint) {
2275 		struct usb_device	*parent = urb->dev->parent;
2276 
2277 		if (parent != hcd->self.root_hub) {
2278 			qh->h_addr_reg = (u8) parent->devnum;
2279 
2280 			/* set up tt info if needed */
2281 			if (urb->dev->tt) {
2282 				qh->h_port_reg = (u8) urb->dev->ttport;
2283 				if (urb->dev->tt->hub)
2284 					qh->h_addr_reg =
2285 						(u8) urb->dev->tt->hub->devnum;
2286 				if (urb->dev->tt->multi)
2287 					qh->h_addr_reg |= 0x80;
2288 			}
2289 		}
2290 	}
2291 
2292 	/* invariant: hep->hcpriv is null OR the qh that's already scheduled.
2293 	 * until we get real dma queues (with an entry for each urb/buffer),
2294 	 * we only have work to do in the former case.
2295 	 */
2296 	spin_lock_irqsave(&musb->lock, flags);
2297 	if (hep->hcpriv || !next_urb(qh)) {
2298 		/* some concurrent activity submitted another urb to hep...
2299 		 * odd, rare, error prone, but legal.
2300 		 */
2301 		kfree(qh);
2302 		qh = NULL;
2303 		ret = 0;
2304 	} else
2305 		ret = musb_schedule(musb, qh,
2306 				epd->bEndpointAddress & USB_ENDPOINT_DIR_MASK);
2307 
2308 	if (ret == 0) {
2309 		urb->hcpriv = qh;
2310 		/* FIXME set urb->start_frame for iso/intr, it's tested in
2311 		 * musb_start_urb(), but otherwise only konicawc cares ...
2312 		 */
2313 	}
2314 	spin_unlock_irqrestore(&musb->lock, flags);
2315 
2316 done:
2317 	if (ret != 0) {
2318 		spin_lock_irqsave(&musb->lock, flags);
2319 		usb_hcd_unlink_urb_from_ep(hcd, urb);
2320 		spin_unlock_irqrestore(&musb->lock, flags);
2321 		kfree(qh);
2322 	}
2323 	return ret;
2324 }
2325 
2326 
2327 /*
2328  * abort a transfer that's at the head of a hardware queue.
2329  * called with controller locked, irqs blocked
2330  * that hardware queue advances to the next transfer, unless prevented
2331  */
2332 static int musb_cleanup_urb(struct urb *urb, struct musb_qh *qh)
2333 {
2334 	struct musb_hw_ep	*ep = qh->hw_ep;
2335 	struct musb		*musb = ep->musb;
2336 	void __iomem		*epio = ep->regs;
2337 	unsigned		hw_end = ep->epnum;
2338 	void __iomem		*regs = ep->musb->mregs;
2339 	int			is_in = usb_pipein(urb->pipe);
2340 	int			status = 0;
2341 	u16			csr;
2342 	struct dma_channel	*dma = NULL;
2343 
2344 	musb_ep_select(regs, hw_end);
2345 
2346 	if (is_dma_capable()) {
2347 		dma = is_in ? ep->rx_channel : ep->tx_channel;
2348 		if (dma) {
2349 			status = ep->musb->dma_controller->channel_abort(dma);
2350 			musb_dbg(musb, "abort %cX%d DMA for urb %p --> %d",
2351 				is_in ? 'R' : 'T', ep->epnum,
2352 				urb, status);
2353 			urb->actual_length += dma->actual_len;
2354 		}
2355 	}
2356 
2357 	/* turn off DMA requests, discard state, stop polling ... */
2358 	if (ep->epnum && is_in) {
2359 		/* giveback saves bulk toggle */
2360 		csr = musb_h_flush_rxfifo(ep, 0);
2361 
2362 		/* clear the endpoint's irq status here to avoid bogus irqs */
2363 		if (is_dma_capable() && dma)
2364 			musb_platform_clear_ep_rxintr(musb, ep->epnum);
2365 	} else if (ep->epnum) {
2366 		musb_h_tx_flush_fifo(ep);
2367 		csr = musb_readw(epio, MUSB_TXCSR);
2368 		csr &= ~(MUSB_TXCSR_AUTOSET
2369 			| MUSB_TXCSR_DMAENAB
2370 			| MUSB_TXCSR_H_RXSTALL
2371 			| MUSB_TXCSR_H_NAKTIMEOUT
2372 			| MUSB_TXCSR_H_ERROR
2373 			| MUSB_TXCSR_TXPKTRDY);
2374 		musb_writew(epio, MUSB_TXCSR, csr);
2375 		/* REVISIT may need to clear FLUSHFIFO ... */
2376 		musb_writew(epio, MUSB_TXCSR, csr);
2377 		/* flush cpu writebuffer */
2378 		csr = musb_readw(epio, MUSB_TXCSR);
2379 	} else  {
2380 		musb_h_ep0_flush_fifo(ep);
2381 	}
2382 	if (status == 0)
2383 		musb_advance_schedule(ep->musb, urb, ep, is_in);
2384 	return status;
2385 }
2386 
2387 static int musb_urb_dequeue(struct usb_hcd *hcd, struct urb *urb, int status)
2388 {
2389 	struct musb		*musb = hcd_to_musb(hcd);
2390 	struct musb_qh		*qh;
2391 	unsigned long		flags;
2392 	int			is_in  = usb_pipein(urb->pipe);
2393 	int			ret;
2394 
2395 	trace_musb_urb_deq(musb, urb);
2396 
2397 	spin_lock_irqsave(&musb->lock, flags);
2398 	ret = usb_hcd_check_unlink_urb(hcd, urb, status);
2399 	if (ret)
2400 		goto done;
2401 
2402 	qh = urb->hcpriv;
2403 	if (!qh)
2404 		goto done;
2405 
2406 	/*
2407 	 * Any URB not actively programmed into endpoint hardware can be
2408 	 * immediately given back; that's any URB not at the head of an
2409 	 * endpoint queue, unless someday we get real DMA queues.  And even
2410 	 * if it's at the head, it might not be known to the hardware...
2411 	 *
2412 	 * Otherwise abort current transfer, pending DMA, etc.; urb->status
2413 	 * has already been updated.  This is a synchronous abort; it'd be
2414 	 * OK to hold off until after some IRQ, though.
2415 	 *
2416 	 * NOTE: qh is invalid unless !list_empty(&hep->urb_list)
2417 	 */
2418 	if (!qh->is_ready
2419 			|| urb->urb_list.prev != &qh->hep->urb_list
2420 			|| musb_ep_get_qh(qh->hw_ep, is_in) != qh) {
2421 		int	ready = qh->is_ready;
2422 
2423 		qh->is_ready = 0;
2424 		musb_giveback(musb, urb, 0);
2425 		qh->is_ready = ready;
2426 
2427 		/* If nothing else (usually musb_giveback) is using it
2428 		 * and its URB list has emptied, recycle this qh.
2429 		 */
2430 		if (ready && list_empty(&qh->hep->urb_list)) {
2431 			qh->hep->hcpriv = NULL;
2432 			list_del(&qh->ring);
2433 			kfree(qh);
2434 		}
2435 	} else
2436 		ret = musb_cleanup_urb(urb, qh);
2437 done:
2438 	spin_unlock_irqrestore(&musb->lock, flags);
2439 	return ret;
2440 }
2441 
2442 /* disable an endpoint */
2443 static void
2444 musb_h_disable(struct usb_hcd *hcd, struct usb_host_endpoint *hep)
2445 {
2446 	u8			is_in = hep->desc.bEndpointAddress & USB_DIR_IN;
2447 	unsigned long		flags;
2448 	struct musb		*musb = hcd_to_musb(hcd);
2449 	struct musb_qh		*qh;
2450 	struct urb		*urb;
2451 
2452 	spin_lock_irqsave(&musb->lock, flags);
2453 
2454 	qh = hep->hcpriv;
2455 	if (qh == NULL)
2456 		goto exit;
2457 
2458 	/* NOTE: qh is invalid unless !list_empty(&hep->urb_list) */
2459 
2460 	/* Kick the first URB off the hardware, if needed */
2461 	qh->is_ready = 0;
2462 	if (musb_ep_get_qh(qh->hw_ep, is_in) == qh) {
2463 		urb = next_urb(qh);
2464 
2465 		/* make software (then hardware) stop ASAP */
2466 		if (!urb->unlinked)
2467 			urb->status = -ESHUTDOWN;
2468 
2469 		/* cleanup */
2470 		musb_cleanup_urb(urb, qh);
2471 
2472 		/* Then nuke all the others ... and advance the
2473 		 * queue on hw_ep (e.g. bulk ring) when we're done.
2474 		 */
2475 		while (!list_empty(&hep->urb_list)) {
2476 			urb = next_urb(qh);
2477 			urb->status = -ESHUTDOWN;
2478 			musb_advance_schedule(musb, urb, qh->hw_ep, is_in);
2479 		}
2480 	} else {
2481 		/* Just empty the queue; the hardware is busy with
2482 		 * other transfers, and since !qh->is_ready nothing
2483 		 * will activate any of these as it advances.
2484 		 */
2485 		while (!list_empty(&hep->urb_list))
2486 			musb_giveback(musb, next_urb(qh), -ESHUTDOWN);
2487 
2488 		hep->hcpriv = NULL;
2489 		list_del(&qh->ring);
2490 		kfree(qh);
2491 	}
2492 exit:
2493 	spin_unlock_irqrestore(&musb->lock, flags);
2494 }
2495 
2496 static int musb_h_get_frame_number(struct usb_hcd *hcd)
2497 {
2498 	struct musb	*musb = hcd_to_musb(hcd);
2499 
2500 	return musb_readw(musb->mregs, MUSB_FRAME);
2501 }
2502 
2503 static int musb_h_start(struct usb_hcd *hcd)
2504 {
2505 	struct musb	*musb = hcd_to_musb(hcd);
2506 
2507 	/* NOTE: musb_start() is called when the hub driver turns
2508 	 * on port power, or when (OTG) peripheral starts.
2509 	 */
2510 	hcd->state = HC_STATE_RUNNING;
2511 	musb->port1_status = 0;
2512 	return 0;
2513 }
2514 
2515 static void musb_h_stop(struct usb_hcd *hcd)
2516 {
2517 	musb_stop(hcd_to_musb(hcd));
2518 	hcd->state = HC_STATE_HALT;
2519 }
2520 
2521 static int musb_bus_suspend(struct usb_hcd *hcd)
2522 {
2523 	struct musb	*musb = hcd_to_musb(hcd);
2524 	u8		devctl;
2525 
2526 	musb_port_suspend(musb, true);
2527 
2528 	if (!is_host_active(musb))
2529 		return 0;
2530 
2531 	switch (musb->xceiv->otg->state) {
2532 	case OTG_STATE_A_SUSPEND:
2533 		return 0;
2534 	case OTG_STATE_A_WAIT_VRISE:
2535 		/* ID could be grounded even if there's no device
2536 		 * on the other end of the cable.  NOTE that the
2537 		 * A_WAIT_VRISE timers are messy with MUSB...
2538 		 */
2539 		devctl = musb_readb(musb->mregs, MUSB_DEVCTL);
2540 		if ((devctl & MUSB_DEVCTL_VBUS) == MUSB_DEVCTL_VBUS)
2541 			musb->xceiv->otg->state = OTG_STATE_A_WAIT_BCON;
2542 		break;
2543 	default:
2544 		break;
2545 	}
2546 
2547 	if (musb->is_active) {
2548 		WARNING("trying to suspend as %s while active\n",
2549 				usb_otg_state_string(musb->xceiv->otg->state));
2550 		return -EBUSY;
2551 	} else
2552 		return 0;
2553 }
2554 
2555 static int musb_bus_resume(struct usb_hcd *hcd)
2556 {
2557 	struct musb *musb = hcd_to_musb(hcd);
2558 
2559 	if (musb->config &&
2560 	    musb->config->host_port_deassert_reset_at_resume)
2561 		musb_port_reset(musb, false);
2562 
2563 	return 0;
2564 }
2565 
2566 #ifndef CONFIG_MUSB_PIO_ONLY
2567 
2568 #define MUSB_USB_DMA_ALIGN 4
2569 
2570 struct musb_temp_buffer {
2571 	void *kmalloc_ptr;
2572 	void *old_xfer_buffer;
2573 	u8 data[0];
2574 };
2575 
2576 static void musb_free_temp_buffer(struct urb *urb)
2577 {
2578 	enum dma_data_direction dir;
2579 	struct musb_temp_buffer *temp;
2580 	size_t length;
2581 
2582 	if (!(urb->transfer_flags & URB_ALIGNED_TEMP_BUFFER))
2583 		return;
2584 
2585 	dir = usb_urb_dir_in(urb) ? DMA_FROM_DEVICE : DMA_TO_DEVICE;
2586 
2587 	temp = container_of(urb->transfer_buffer, struct musb_temp_buffer,
2588 			    data);
2589 
2590 	if (dir == DMA_FROM_DEVICE) {
2591 		if (usb_pipeisoc(urb->pipe))
2592 			length = urb->transfer_buffer_length;
2593 		else
2594 			length = urb->actual_length;
2595 
2596 		memcpy(temp->old_xfer_buffer, temp->data, length);
2597 	}
2598 	urb->transfer_buffer = temp->old_xfer_buffer;
2599 	kfree(temp->kmalloc_ptr);
2600 
2601 	urb->transfer_flags &= ~URB_ALIGNED_TEMP_BUFFER;
2602 }
2603 
2604 static int musb_alloc_temp_buffer(struct urb *urb, gfp_t mem_flags)
2605 {
2606 	enum dma_data_direction dir;
2607 	struct musb_temp_buffer *temp;
2608 	void *kmalloc_ptr;
2609 	size_t kmalloc_size;
2610 
2611 	if (urb->num_sgs || urb->sg ||
2612 	    urb->transfer_buffer_length == 0 ||
2613 	    !((uintptr_t)urb->transfer_buffer & (MUSB_USB_DMA_ALIGN - 1)))
2614 		return 0;
2615 
2616 	dir = usb_urb_dir_in(urb) ? DMA_FROM_DEVICE : DMA_TO_DEVICE;
2617 
2618 	/* Allocate a buffer with enough padding for alignment */
2619 	kmalloc_size = urb->transfer_buffer_length +
2620 		sizeof(struct musb_temp_buffer) + MUSB_USB_DMA_ALIGN - 1;
2621 
2622 	kmalloc_ptr = kmalloc(kmalloc_size, mem_flags);
2623 	if (!kmalloc_ptr)
2624 		return -ENOMEM;
2625 
2626 	/* Position our struct temp_buffer such that data is aligned */
2627 	temp = PTR_ALIGN(kmalloc_ptr, MUSB_USB_DMA_ALIGN);
2628 
2629 
2630 	temp->kmalloc_ptr = kmalloc_ptr;
2631 	temp->old_xfer_buffer = urb->transfer_buffer;
2632 	if (dir == DMA_TO_DEVICE)
2633 		memcpy(temp->data, urb->transfer_buffer,
2634 		       urb->transfer_buffer_length);
2635 	urb->transfer_buffer = temp->data;
2636 
2637 	urb->transfer_flags |= URB_ALIGNED_TEMP_BUFFER;
2638 
2639 	return 0;
2640 }
2641 
2642 static int musb_map_urb_for_dma(struct usb_hcd *hcd, struct urb *urb,
2643 				      gfp_t mem_flags)
2644 {
2645 	struct musb	*musb = hcd_to_musb(hcd);
2646 	int ret;
2647 
2648 	/*
2649 	 * The DMA engine in RTL1.8 and above cannot handle
2650 	 * DMA addresses that are not aligned to a 4 byte boundary.
2651 	 * For such engine implemented (un)map_urb_for_dma hooks.
2652 	 * Do not use these hooks for RTL<1.8
2653 	 */
2654 	if (musb->hwvers < MUSB_HWVERS_1800)
2655 		return usb_hcd_map_urb_for_dma(hcd, urb, mem_flags);
2656 
2657 	ret = musb_alloc_temp_buffer(urb, mem_flags);
2658 	if (ret)
2659 		return ret;
2660 
2661 	ret = usb_hcd_map_urb_for_dma(hcd, urb, mem_flags);
2662 	if (ret)
2663 		musb_free_temp_buffer(urb);
2664 
2665 	return ret;
2666 }
2667 
2668 static void musb_unmap_urb_for_dma(struct usb_hcd *hcd, struct urb *urb)
2669 {
2670 	struct musb	*musb = hcd_to_musb(hcd);
2671 
2672 	usb_hcd_unmap_urb_for_dma(hcd, urb);
2673 
2674 	/* Do not use this hook for RTL<1.8 (see description above) */
2675 	if (musb->hwvers < MUSB_HWVERS_1800)
2676 		return;
2677 
2678 	musb_free_temp_buffer(urb);
2679 }
2680 #endif /* !CONFIG_MUSB_PIO_ONLY */
2681 
2682 static const struct hc_driver musb_hc_driver = {
2683 	.description		= "musb-hcd",
2684 	.product_desc		= "MUSB HDRC host driver",
2685 	.hcd_priv_size		= sizeof(struct musb *),
2686 	.flags			= HCD_USB2 | HCD_MEMORY,
2687 
2688 	/* not using irq handler or reset hooks from usbcore, since
2689 	 * those must be shared with peripheral code for OTG configs
2690 	 */
2691 
2692 	.start			= musb_h_start,
2693 	.stop			= musb_h_stop,
2694 
2695 	.get_frame_number	= musb_h_get_frame_number,
2696 
2697 	.urb_enqueue		= musb_urb_enqueue,
2698 	.urb_dequeue		= musb_urb_dequeue,
2699 	.endpoint_disable	= musb_h_disable,
2700 
2701 #ifndef CONFIG_MUSB_PIO_ONLY
2702 	.map_urb_for_dma	= musb_map_urb_for_dma,
2703 	.unmap_urb_for_dma	= musb_unmap_urb_for_dma,
2704 #endif
2705 
2706 	.hub_status_data	= musb_hub_status_data,
2707 	.hub_control		= musb_hub_control,
2708 	.bus_suspend		= musb_bus_suspend,
2709 	.bus_resume		= musb_bus_resume,
2710 	/* .start_port_reset	= NULL, */
2711 	/* .hub_irq_enable	= NULL, */
2712 };
2713 
2714 int musb_host_alloc(struct musb *musb)
2715 {
2716 	struct device	*dev = musb->controller;
2717 
2718 	/* usbcore sets dev->driver_data to hcd, and sometimes uses that... */
2719 	musb->hcd = usb_create_hcd(&musb_hc_driver, dev, dev_name(dev));
2720 	if (!musb->hcd)
2721 		return -EINVAL;
2722 
2723 	*musb->hcd->hcd_priv = (unsigned long) musb;
2724 	musb->hcd->self.uses_pio_for_control = 1;
2725 	musb->hcd->uses_new_polling = 1;
2726 	musb->hcd->has_tt = 1;
2727 
2728 	return 0;
2729 }
2730 
2731 void musb_host_cleanup(struct musb *musb)
2732 {
2733 	if (musb->port_mode == MUSB_PORT_MODE_GADGET)
2734 		return;
2735 	usb_remove_hcd(musb->hcd);
2736 }
2737 
2738 void musb_host_free(struct musb *musb)
2739 {
2740 	usb_put_hcd(musb->hcd);
2741 }
2742 
2743 int musb_host_setup(struct musb *musb, int power_budget)
2744 {
2745 	int ret;
2746 	struct usb_hcd *hcd = musb->hcd;
2747 
2748 	if (musb->port_mode == MUSB_PORT_MODE_HOST) {
2749 		MUSB_HST_MODE(musb);
2750 		musb->xceiv->otg->default_a = 1;
2751 		musb->xceiv->otg->state = OTG_STATE_A_IDLE;
2752 	}
2753 	otg_set_host(musb->xceiv->otg, &hcd->self);
2754 	hcd->self.otg_port = 1;
2755 	musb->xceiv->otg->host = &hcd->self;
2756 	hcd->power_budget = 2 * (power_budget ? : 250);
2757 
2758 	ret = usb_add_hcd(hcd, 0, 0);
2759 	if (ret < 0)
2760 		return ret;
2761 
2762 	device_wakeup_enable(hcd->self.controller);
2763 	return 0;
2764 }
2765 
2766 void musb_host_resume_root_hub(struct musb *musb)
2767 {
2768 	usb_hcd_resume_root_hub(musb->hcd);
2769 }
2770 
2771 void musb_host_poke_root_hub(struct musb *musb)
2772 {
2773 	MUSB_HST_MODE(musb);
2774 	if (musb->hcd->status_urb)
2775 		usb_hcd_poll_rh_status(musb->hcd);
2776 	else
2777 		usb_hcd_resume_root_hub(musb->hcd);
2778 }
2779