xref: /openbmc/linux/drivers/net/ethernet/ibm/emac/core.c (revision eb3fcf007fffe5830d815e713591f3e858f2a365)
1 /*
2  * drivers/net/ethernet/ibm/emac/core.c
3  *
4  * Driver for PowerPC 4xx on-chip ethernet controller.
5  *
6  * Copyright 2007 Benjamin Herrenschmidt, IBM Corp.
7  *                <benh@kernel.crashing.org>
8  *
9  * Based on the arch/ppc version of the driver:
10  *
11  * Copyright (c) 2004, 2005 Zultys Technologies.
12  * Eugene Surovegin <eugene.surovegin@zultys.com> or <ebs@ebshome.net>
13  *
14  * Based on original work by
15  * 	Matt Porter <mporter@kernel.crashing.org>
16  *	(c) 2003 Benjamin Herrenschmidt <benh@kernel.crashing.org>
17  *      Armin Kuster <akuster@mvista.com>
18  * 	Johnnie Peters <jpeters@mvista.com>
19  *
20  * This program is free software; you can redistribute  it and/or modify it
21  * under  the terms of  the GNU General  Public License as published by the
22  * Free Software Foundation;  either version 2 of the  License, or (at your
23  * option) any later version.
24  *
25  */
26 
27 #include <linux/module.h>
28 #include <linux/sched.h>
29 #include <linux/string.h>
30 #include <linux/errno.h>
31 #include <linux/delay.h>
32 #include <linux/types.h>
33 #include <linux/pci.h>
34 #include <linux/etherdevice.h>
35 #include <linux/skbuff.h>
36 #include <linux/crc32.h>
37 #include <linux/ethtool.h>
38 #include <linux/mii.h>
39 #include <linux/bitops.h>
40 #include <linux/workqueue.h>
41 #include <linux/of.h>
42 #include <linux/of_address.h>
43 #include <linux/of_irq.h>
44 #include <linux/of_net.h>
45 #include <linux/slab.h>
46 
47 #include <asm/processor.h>
48 #include <asm/io.h>
49 #include <asm/dma.h>
50 #include <asm/uaccess.h>
51 #include <asm/dcr.h>
52 #include <asm/dcr-regs.h>
53 
54 #include "core.h"
55 
56 /*
57  * Lack of dma_unmap_???? calls is intentional.
58  *
59  * API-correct usage requires additional support state information to be
60  * maintained for every RX and TX buffer descriptor (BD). Unfortunately, due to
61  * EMAC design (e.g. TX buffer passed from network stack can be split into
62  * several BDs, dma_map_single/dma_map_page can be used to map particular BD),
63  * maintaining such information will add additional overhead.
64  * Current DMA API implementation for 4xx processors only ensures cache coherency
65  * and dma_unmap_???? routines are empty and are likely to stay this way.
66  * I decided to omit dma_unmap_??? calls because I don't want to add additional
67  * complexity just for the sake of following some abstract API, when it doesn't
68  * add any real benefit to the driver. I understand that this decision maybe
69  * controversial, but I really tried to make code API-correct and efficient
70  * at the same time and didn't come up with code I liked :(.                --ebs
71  */
72 
73 #define DRV_NAME        "emac"
74 #define DRV_VERSION     "3.54"
75 #define DRV_DESC        "PPC 4xx OCP EMAC driver"
76 
77 MODULE_DESCRIPTION(DRV_DESC);
78 MODULE_AUTHOR
79     ("Eugene Surovegin <eugene.surovegin@zultys.com> or <ebs@ebshome.net>");
80 MODULE_LICENSE("GPL");
81 
82 /* minimum number of free TX descriptors required to wake up TX process */
83 #define EMAC_TX_WAKEUP_THRESH		(NUM_TX_BUFF / 4)
84 
85 /* If packet size is less than this number, we allocate small skb and copy packet
86  * contents into it instead of just sending original big skb up
87  */
88 #define EMAC_RX_COPY_THRESH		CONFIG_IBM_EMAC_RX_COPY_THRESHOLD
89 
90 /* Since multiple EMACs share MDIO lines in various ways, we need
91  * to avoid re-using the same PHY ID in cases where the arch didn't
92  * setup precise phy_map entries
93  *
94  * XXX This is something that needs to be reworked as we can have multiple
95  * EMAC "sets" (multiple ASICs containing several EMACs) though we can
96  * probably require in that case to have explicit PHY IDs in the device-tree
97  */
98 static u32 busy_phy_map;
99 static DEFINE_MUTEX(emac_phy_map_lock);
100 
101 /* This is the wait queue used to wait on any event related to probe, that
102  * is discovery of MALs, other EMACs, ZMII/RGMIIs, etc...
103  */
104 static DECLARE_WAIT_QUEUE_HEAD(emac_probe_wait);
105 
106 /* Having stable interface names is a doomed idea. However, it would be nice
107  * if we didn't have completely random interface names at boot too :-) It's
108  * just a matter of making everybody's life easier. Since we are doing
109  * threaded probing, it's a bit harder though. The base idea here is that
110  * we make up a list of all emacs in the device-tree before we register the
111  * driver. Every emac will then wait for the previous one in the list to
112  * initialize before itself. We should also keep that list ordered by
113  * cell_index.
114  * That list is only 4 entries long, meaning that additional EMACs don't
115  * get ordering guarantees unless EMAC_BOOT_LIST_SIZE is increased.
116  */
117 
118 #define EMAC_BOOT_LIST_SIZE	4
119 static struct device_node *emac_boot_list[EMAC_BOOT_LIST_SIZE];
120 
121 /* How long should I wait for dependent devices ? */
122 #define EMAC_PROBE_DEP_TIMEOUT	(HZ * 5)
123 
124 /* I don't want to litter system log with timeout errors
125  * when we have brain-damaged PHY.
126  */
127 static inline void emac_report_timeout_error(struct emac_instance *dev,
128 					     const char *error)
129 {
130 	if (emac_has_feature(dev, EMAC_FTR_440GX_PHY_CLK_FIX |
131 				  EMAC_FTR_460EX_PHY_CLK_FIX |
132 				  EMAC_FTR_440EP_PHY_CLK_FIX))
133 		DBG(dev, "%s" NL, error);
134 	else if (net_ratelimit())
135 		printk(KERN_ERR "%s: %s\n", dev->ofdev->dev.of_node->full_name,
136 			error);
137 }
138 
139 /* EMAC PHY clock workaround:
140  * 440EP/440GR has more sane SDR0_MFR register implementation than 440GX,
141  * which allows controlling each EMAC clock
142  */
143 static inline void emac_rx_clk_tx(struct emac_instance *dev)
144 {
145 #ifdef CONFIG_PPC_DCR_NATIVE
146 	if (emac_has_feature(dev, EMAC_FTR_440EP_PHY_CLK_FIX))
147 		dcri_clrset(SDR0, SDR0_MFR,
148 			    0, SDR0_MFR_ECS >> dev->cell_index);
149 #endif
150 }
151 
152 static inline void emac_rx_clk_default(struct emac_instance *dev)
153 {
154 #ifdef CONFIG_PPC_DCR_NATIVE
155 	if (emac_has_feature(dev, EMAC_FTR_440EP_PHY_CLK_FIX))
156 		dcri_clrset(SDR0, SDR0_MFR,
157 			    SDR0_MFR_ECS >> dev->cell_index, 0);
158 #endif
159 }
160 
161 /* PHY polling intervals */
162 #define PHY_POLL_LINK_ON	HZ
163 #define PHY_POLL_LINK_OFF	(HZ / 5)
164 
165 /* Graceful stop timeouts in us.
166  * We should allow up to 1 frame time (full-duplex, ignoring collisions)
167  */
168 #define STOP_TIMEOUT_10		1230
169 #define STOP_TIMEOUT_100	124
170 #define STOP_TIMEOUT_1000	13
171 #define STOP_TIMEOUT_1000_JUMBO	73
172 
173 static unsigned char default_mcast_addr[] = {
174 	0x01, 0x80, 0xC2, 0x00, 0x00, 0x01
175 };
176 
177 /* Please, keep in sync with struct ibm_emac_stats/ibm_emac_error_stats */
178 static const char emac_stats_keys[EMAC_ETHTOOL_STATS_COUNT][ETH_GSTRING_LEN] = {
179 	"rx_packets", "rx_bytes", "tx_packets", "tx_bytes", "rx_packets_csum",
180 	"tx_packets_csum", "tx_undo", "rx_dropped_stack", "rx_dropped_oom",
181 	"rx_dropped_error", "rx_dropped_resize", "rx_dropped_mtu",
182 	"rx_stopped", "rx_bd_errors", "rx_bd_overrun", "rx_bd_bad_packet",
183 	"rx_bd_runt_packet", "rx_bd_short_event", "rx_bd_alignment_error",
184 	"rx_bd_bad_fcs", "rx_bd_packet_too_long", "rx_bd_out_of_range",
185 	"rx_bd_in_range", "rx_parity", "rx_fifo_overrun", "rx_overrun",
186 	"rx_bad_packet", "rx_runt_packet", "rx_short_event",
187 	"rx_alignment_error", "rx_bad_fcs", "rx_packet_too_long",
188 	"rx_out_of_range", "rx_in_range", "tx_dropped", "tx_bd_errors",
189 	"tx_bd_bad_fcs", "tx_bd_carrier_loss", "tx_bd_excessive_deferral",
190 	"tx_bd_excessive_collisions", "tx_bd_late_collision",
191 	"tx_bd_multple_collisions", "tx_bd_single_collision",
192 	"tx_bd_underrun", "tx_bd_sqe", "tx_parity", "tx_underrun", "tx_sqe",
193 	"tx_errors"
194 };
195 
196 static irqreturn_t emac_irq(int irq, void *dev_instance);
197 static void emac_clean_tx_ring(struct emac_instance *dev);
198 static void __emac_set_multicast_list(struct emac_instance *dev);
199 
200 static inline int emac_phy_supports_gige(int phy_mode)
201 {
202 	return  phy_mode == PHY_MODE_GMII ||
203 		phy_mode == PHY_MODE_RGMII ||
204 		phy_mode == PHY_MODE_SGMII ||
205 		phy_mode == PHY_MODE_TBI ||
206 		phy_mode == PHY_MODE_RTBI;
207 }
208 
209 static inline int emac_phy_gpcs(int phy_mode)
210 {
211 	return  phy_mode == PHY_MODE_SGMII ||
212 		phy_mode == PHY_MODE_TBI ||
213 		phy_mode == PHY_MODE_RTBI;
214 }
215 
216 static inline void emac_tx_enable(struct emac_instance *dev)
217 {
218 	struct emac_regs __iomem *p = dev->emacp;
219 	u32 r;
220 
221 	DBG(dev, "tx_enable" NL);
222 
223 	r = in_be32(&p->mr0);
224 	if (!(r & EMAC_MR0_TXE))
225 		out_be32(&p->mr0, r | EMAC_MR0_TXE);
226 }
227 
228 static void emac_tx_disable(struct emac_instance *dev)
229 {
230 	struct emac_regs __iomem *p = dev->emacp;
231 	u32 r;
232 
233 	DBG(dev, "tx_disable" NL);
234 
235 	r = in_be32(&p->mr0);
236 	if (r & EMAC_MR0_TXE) {
237 		int n = dev->stop_timeout;
238 		out_be32(&p->mr0, r & ~EMAC_MR0_TXE);
239 		while (!(in_be32(&p->mr0) & EMAC_MR0_TXI) && n) {
240 			udelay(1);
241 			--n;
242 		}
243 		if (unlikely(!n))
244 			emac_report_timeout_error(dev, "TX disable timeout");
245 	}
246 }
247 
248 static void emac_rx_enable(struct emac_instance *dev)
249 {
250 	struct emac_regs __iomem *p = dev->emacp;
251 	u32 r;
252 
253 	if (unlikely(test_bit(MAL_COMMAC_RX_STOPPED, &dev->commac.flags)))
254 		goto out;
255 
256 	DBG(dev, "rx_enable" NL);
257 
258 	r = in_be32(&p->mr0);
259 	if (!(r & EMAC_MR0_RXE)) {
260 		if (unlikely(!(r & EMAC_MR0_RXI))) {
261 			/* Wait if previous async disable is still in progress */
262 			int n = dev->stop_timeout;
263 			while (!(r = in_be32(&p->mr0) & EMAC_MR0_RXI) && n) {
264 				udelay(1);
265 				--n;
266 			}
267 			if (unlikely(!n))
268 				emac_report_timeout_error(dev,
269 							  "RX disable timeout");
270 		}
271 		out_be32(&p->mr0, r | EMAC_MR0_RXE);
272 	}
273  out:
274 	;
275 }
276 
277 static void emac_rx_disable(struct emac_instance *dev)
278 {
279 	struct emac_regs __iomem *p = dev->emacp;
280 	u32 r;
281 
282 	DBG(dev, "rx_disable" NL);
283 
284 	r = in_be32(&p->mr0);
285 	if (r & EMAC_MR0_RXE) {
286 		int n = dev->stop_timeout;
287 		out_be32(&p->mr0, r & ~EMAC_MR0_RXE);
288 		while (!(in_be32(&p->mr0) & EMAC_MR0_RXI) && n) {
289 			udelay(1);
290 			--n;
291 		}
292 		if (unlikely(!n))
293 			emac_report_timeout_error(dev, "RX disable timeout");
294 	}
295 }
296 
297 static inline void emac_netif_stop(struct emac_instance *dev)
298 {
299 	netif_tx_lock_bh(dev->ndev);
300 	netif_addr_lock(dev->ndev);
301 	dev->no_mcast = 1;
302 	netif_addr_unlock(dev->ndev);
303 	netif_tx_unlock_bh(dev->ndev);
304 	dev->ndev->trans_start = jiffies;	/* prevent tx timeout */
305 	mal_poll_disable(dev->mal, &dev->commac);
306 	netif_tx_disable(dev->ndev);
307 }
308 
309 static inline void emac_netif_start(struct emac_instance *dev)
310 {
311 	netif_tx_lock_bh(dev->ndev);
312 	netif_addr_lock(dev->ndev);
313 	dev->no_mcast = 0;
314 	if (dev->mcast_pending && netif_running(dev->ndev))
315 		__emac_set_multicast_list(dev);
316 	netif_addr_unlock(dev->ndev);
317 	netif_tx_unlock_bh(dev->ndev);
318 
319 	netif_wake_queue(dev->ndev);
320 
321 	/* NOTE: unconditional netif_wake_queue is only appropriate
322 	 * so long as all callers are assured to have free tx slots
323 	 * (taken from tg3... though the case where that is wrong is
324 	 *  not terribly harmful)
325 	 */
326 	mal_poll_enable(dev->mal, &dev->commac);
327 }
328 
329 static inline void emac_rx_disable_async(struct emac_instance *dev)
330 {
331 	struct emac_regs __iomem *p = dev->emacp;
332 	u32 r;
333 
334 	DBG(dev, "rx_disable_async" NL);
335 
336 	r = in_be32(&p->mr0);
337 	if (r & EMAC_MR0_RXE)
338 		out_be32(&p->mr0, r & ~EMAC_MR0_RXE);
339 }
340 
341 static int emac_reset(struct emac_instance *dev)
342 {
343 	struct emac_regs __iomem *p = dev->emacp;
344 	int n = 20;
345 
346 	DBG(dev, "reset" NL);
347 
348 	if (!dev->reset_failed) {
349 		/* 40x erratum suggests stopping RX channel before reset,
350 		 * we stop TX as well
351 		 */
352 		emac_rx_disable(dev);
353 		emac_tx_disable(dev);
354 	}
355 
356 #ifdef CONFIG_PPC_DCR_NATIVE
357 	/*
358 	 * PPC460EX/GT Embedded Processor Advanced User's Manual
359 	 * section 28.10.1 Mode Register 0 (EMACx_MR0) states:
360 	 * Note: The PHY must provide a TX Clk in order to perform a soft reset
361 	 * of the EMAC. If none is present, select the internal clock
362 	 * (SDR0_ETH_CFG[EMACx_PHY_CLK] = 1).
363 	 * After a soft reset, select the external clock.
364 	 */
365 	if (emac_has_feature(dev, EMAC_FTR_460EX_PHY_CLK_FIX)) {
366 		if (dev->phy_address == 0xffffffff &&
367 		    dev->phy_map == 0xffffffff) {
368 			/* No PHY: select internal loop clock before reset */
369 			dcri_clrset(SDR0, SDR0_ETH_CFG,
370 				    0, SDR0_ETH_CFG_ECS << dev->cell_index);
371 		} else {
372 			/* PHY present: select external clock before reset */
373 			dcri_clrset(SDR0, SDR0_ETH_CFG,
374 				    SDR0_ETH_CFG_ECS << dev->cell_index, 0);
375 		}
376 	}
377 #endif
378 
379 	out_be32(&p->mr0, EMAC_MR0_SRST);
380 	while ((in_be32(&p->mr0) & EMAC_MR0_SRST) && n)
381 		--n;
382 
383 #ifdef CONFIG_PPC_DCR_NATIVE
384 	if (emac_has_feature(dev, EMAC_FTR_460EX_PHY_CLK_FIX)) {
385 		if (dev->phy_address == 0xffffffff &&
386 		    dev->phy_map == 0xffffffff) {
387 			/* No PHY: restore external clock source after reset */
388 			dcri_clrset(SDR0, SDR0_ETH_CFG,
389 				    SDR0_ETH_CFG_ECS << dev->cell_index, 0);
390 		}
391 	}
392 #endif
393 
394 	if (n) {
395 		dev->reset_failed = 0;
396 		return 0;
397 	} else {
398 		emac_report_timeout_error(dev, "reset timeout");
399 		dev->reset_failed = 1;
400 		return -ETIMEDOUT;
401 	}
402 }
403 
404 static void emac_hash_mc(struct emac_instance *dev)
405 {
406 	const int regs = EMAC_XAHT_REGS(dev);
407 	u32 *gaht_base = emac_gaht_base(dev);
408 	u32 gaht_temp[regs];
409 	struct netdev_hw_addr *ha;
410 	int i;
411 
412 	DBG(dev, "hash_mc %d" NL, netdev_mc_count(dev->ndev));
413 
414 	memset(gaht_temp, 0, sizeof (gaht_temp));
415 
416 	netdev_for_each_mc_addr(ha, dev->ndev) {
417 		int slot, reg, mask;
418 		DBG2(dev, "mc %pM" NL, ha->addr);
419 
420 		slot = EMAC_XAHT_CRC_TO_SLOT(dev,
421 					     ether_crc(ETH_ALEN, ha->addr));
422 		reg = EMAC_XAHT_SLOT_TO_REG(dev, slot);
423 		mask = EMAC_XAHT_SLOT_TO_MASK(dev, slot);
424 
425 		gaht_temp[reg] |= mask;
426 	}
427 
428 	for (i = 0; i < regs; i++)
429 		out_be32(gaht_base + i, gaht_temp[i]);
430 }
431 
432 static inline u32 emac_iff2rmr(struct net_device *ndev)
433 {
434 	struct emac_instance *dev = netdev_priv(ndev);
435 	u32 r;
436 
437 	r = EMAC_RMR_SP | EMAC_RMR_SFCS | EMAC_RMR_IAE | EMAC_RMR_BAE;
438 
439 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
440 	    r |= EMAC4_RMR_BASE;
441 	else
442 	    r |= EMAC_RMR_BASE;
443 
444 	if (ndev->flags & IFF_PROMISC)
445 		r |= EMAC_RMR_PME;
446 	else if (ndev->flags & IFF_ALLMULTI ||
447 			 (netdev_mc_count(ndev) > EMAC_XAHT_SLOTS(dev)))
448 		r |= EMAC_RMR_PMME;
449 	else if (!netdev_mc_empty(ndev))
450 		r |= EMAC_RMR_MAE;
451 
452 	if (emac_has_feature(dev, EMAC_APM821XX_REQ_JUMBO_FRAME_SIZE)) {
453 		r &= ~EMAC4_RMR_MJS_MASK;
454 		r |= EMAC4_RMR_MJS(ndev->mtu);
455 	}
456 
457 	return r;
458 }
459 
460 static u32 __emac_calc_base_mr1(struct emac_instance *dev, int tx_size, int rx_size)
461 {
462 	u32 ret = EMAC_MR1_VLE | EMAC_MR1_IST | EMAC_MR1_TR0_MULT;
463 
464 	DBG2(dev, "__emac_calc_base_mr1" NL);
465 
466 	switch(tx_size) {
467 	case 2048:
468 		ret |= EMAC_MR1_TFS_2K;
469 		break;
470 	default:
471 		printk(KERN_WARNING "%s: Unknown Tx FIFO size %d\n",
472 		       dev->ndev->name, tx_size);
473 	}
474 
475 	switch(rx_size) {
476 	case 16384:
477 		ret |= EMAC_MR1_RFS_16K;
478 		break;
479 	case 4096:
480 		ret |= EMAC_MR1_RFS_4K;
481 		break;
482 	default:
483 		printk(KERN_WARNING "%s: Unknown Rx FIFO size %d\n",
484 		       dev->ndev->name, rx_size);
485 	}
486 
487 	return ret;
488 }
489 
490 static u32 __emac4_calc_base_mr1(struct emac_instance *dev, int tx_size, int rx_size)
491 {
492 	u32 ret = EMAC_MR1_VLE | EMAC_MR1_IST | EMAC4_MR1_TR |
493 		EMAC4_MR1_OBCI(dev->opb_bus_freq / 1000000);
494 
495 	DBG2(dev, "__emac4_calc_base_mr1" NL);
496 
497 	switch(tx_size) {
498 	case 16384:
499 		ret |= EMAC4_MR1_TFS_16K;
500 		break;
501 	case 4096:
502 		ret |= EMAC4_MR1_TFS_4K;
503 		break;
504 	case 2048:
505 		ret |= EMAC4_MR1_TFS_2K;
506 		break;
507 	default:
508 		printk(KERN_WARNING "%s: Unknown Tx FIFO size %d\n",
509 		       dev->ndev->name, tx_size);
510 	}
511 
512 	switch(rx_size) {
513 	case 16384:
514 		ret |= EMAC4_MR1_RFS_16K;
515 		break;
516 	case 4096:
517 		ret |= EMAC4_MR1_RFS_4K;
518 		break;
519 	case 2048:
520 		ret |= EMAC4_MR1_RFS_2K;
521 		break;
522 	default:
523 		printk(KERN_WARNING "%s: Unknown Rx FIFO size %d\n",
524 		       dev->ndev->name, rx_size);
525 	}
526 
527 	return ret;
528 }
529 
530 static u32 emac_calc_base_mr1(struct emac_instance *dev, int tx_size, int rx_size)
531 {
532 	return emac_has_feature(dev, EMAC_FTR_EMAC4) ?
533 		__emac4_calc_base_mr1(dev, tx_size, rx_size) :
534 		__emac_calc_base_mr1(dev, tx_size, rx_size);
535 }
536 
537 static inline u32 emac_calc_trtr(struct emac_instance *dev, unsigned int size)
538 {
539 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
540 		return ((size >> 6) - 1) << EMAC_TRTR_SHIFT_EMAC4;
541 	else
542 		return ((size >> 6) - 1) << EMAC_TRTR_SHIFT;
543 }
544 
545 static inline u32 emac_calc_rwmr(struct emac_instance *dev,
546 				 unsigned int low, unsigned int high)
547 {
548 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
549 		return (low << 22) | ( (high & 0x3ff) << 6);
550 	else
551 		return (low << 23) | ( (high & 0x1ff) << 7);
552 }
553 
554 static int emac_configure(struct emac_instance *dev)
555 {
556 	struct emac_regs __iomem *p = dev->emacp;
557 	struct net_device *ndev = dev->ndev;
558 	int tx_size, rx_size, link = netif_carrier_ok(dev->ndev);
559 	u32 r, mr1 = 0;
560 
561 	DBG(dev, "configure" NL);
562 
563 	if (!link) {
564 		out_be32(&p->mr1, in_be32(&p->mr1)
565 			 | EMAC_MR1_FDE | EMAC_MR1_ILE);
566 		udelay(100);
567 	} else if (emac_reset(dev) < 0)
568 		return -ETIMEDOUT;
569 
570 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH))
571 		tah_reset(dev->tah_dev);
572 
573 	DBG(dev, " link = %d duplex = %d, pause = %d, asym_pause = %d\n",
574 	    link, dev->phy.duplex, dev->phy.pause, dev->phy.asym_pause);
575 
576 	/* Default fifo sizes */
577 	tx_size = dev->tx_fifo_size;
578 	rx_size = dev->rx_fifo_size;
579 
580 	/* No link, force loopback */
581 	if (!link)
582 		mr1 = EMAC_MR1_FDE | EMAC_MR1_ILE;
583 
584 	/* Check for full duplex */
585 	else if (dev->phy.duplex == DUPLEX_FULL)
586 		mr1 |= EMAC_MR1_FDE | EMAC_MR1_MWSW_001;
587 
588 	/* Adjust fifo sizes, mr1 and timeouts based on link speed */
589 	dev->stop_timeout = STOP_TIMEOUT_10;
590 	switch (dev->phy.speed) {
591 	case SPEED_1000:
592 		if (emac_phy_gpcs(dev->phy.mode)) {
593 			mr1 |= EMAC_MR1_MF_1000GPCS | EMAC_MR1_MF_IPPA(
594 				(dev->phy.gpcs_address != 0xffffffff) ?
595 				 dev->phy.gpcs_address : dev->phy.address);
596 
597 			/* Put some arbitrary OUI, Manuf & Rev IDs so we can
598 			 * identify this GPCS PHY later.
599 			 */
600 			out_be32(&p->u1.emac4.ipcr, 0xdeadbeef);
601 		} else
602 			mr1 |= EMAC_MR1_MF_1000;
603 
604 		/* Extended fifo sizes */
605 		tx_size = dev->tx_fifo_size_gige;
606 		rx_size = dev->rx_fifo_size_gige;
607 
608 		if (dev->ndev->mtu > ETH_DATA_LEN) {
609 			if (emac_has_feature(dev, EMAC_FTR_EMAC4))
610 				mr1 |= EMAC4_MR1_JPSM;
611 			else
612 				mr1 |= EMAC_MR1_JPSM;
613 			dev->stop_timeout = STOP_TIMEOUT_1000_JUMBO;
614 		} else
615 			dev->stop_timeout = STOP_TIMEOUT_1000;
616 		break;
617 	case SPEED_100:
618 		mr1 |= EMAC_MR1_MF_100;
619 		dev->stop_timeout = STOP_TIMEOUT_100;
620 		break;
621 	default: /* make gcc happy */
622 		break;
623 	}
624 
625 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
626 		rgmii_set_speed(dev->rgmii_dev, dev->rgmii_port,
627 				dev->phy.speed);
628 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
629 		zmii_set_speed(dev->zmii_dev, dev->zmii_port, dev->phy.speed);
630 
631 	/* on 40x erratum forces us to NOT use integrated flow control,
632 	 * let's hope it works on 44x ;)
633 	 */
634 	if (!emac_has_feature(dev, EMAC_FTR_NO_FLOW_CONTROL_40x) &&
635 	    dev->phy.duplex == DUPLEX_FULL) {
636 		if (dev->phy.pause)
637 			mr1 |= EMAC_MR1_EIFC | EMAC_MR1_APP;
638 		else if (dev->phy.asym_pause)
639 			mr1 |= EMAC_MR1_APP;
640 	}
641 
642 	/* Add base settings & fifo sizes & program MR1 */
643 	mr1 |= emac_calc_base_mr1(dev, tx_size, rx_size);
644 	out_be32(&p->mr1, mr1);
645 
646 	/* Set individual MAC address */
647 	out_be32(&p->iahr, (ndev->dev_addr[0] << 8) | ndev->dev_addr[1]);
648 	out_be32(&p->ialr, (ndev->dev_addr[2] << 24) |
649 		 (ndev->dev_addr[3] << 16) | (ndev->dev_addr[4] << 8) |
650 		 ndev->dev_addr[5]);
651 
652 	/* VLAN Tag Protocol ID */
653 	out_be32(&p->vtpid, 0x8100);
654 
655 	/* Receive mode register */
656 	r = emac_iff2rmr(ndev);
657 	if (r & EMAC_RMR_MAE)
658 		emac_hash_mc(dev);
659 	out_be32(&p->rmr, r);
660 
661 	/* FIFOs thresholds */
662 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
663 		r = EMAC4_TMR1((dev->mal_burst_size / dev->fifo_entry_size) + 1,
664 			       tx_size / 2 / dev->fifo_entry_size);
665 	else
666 		r = EMAC_TMR1((dev->mal_burst_size / dev->fifo_entry_size) + 1,
667 			      tx_size / 2 / dev->fifo_entry_size);
668 	out_be32(&p->tmr1, r);
669 	out_be32(&p->trtr, emac_calc_trtr(dev, tx_size / 2));
670 
671 	/* PAUSE frame is sent when RX FIFO reaches its high-water mark,
672 	   there should be still enough space in FIFO to allow the our link
673 	   partner time to process this frame and also time to send PAUSE
674 	   frame itself.
675 
676 	   Here is the worst case scenario for the RX FIFO "headroom"
677 	   (from "The Switch Book") (100Mbps, without preamble, inter-frame gap):
678 
679 	   1) One maximum-length frame on TX                    1522 bytes
680 	   2) One PAUSE frame time                                64 bytes
681 	   3) PAUSE frame decode time allowance                   64 bytes
682 	   4) One maximum-length frame on RX                    1522 bytes
683 	   5) Round-trip propagation delay of the link (100Mb)    15 bytes
684 	   ----------
685 	   3187 bytes
686 
687 	   I chose to set high-water mark to RX_FIFO_SIZE / 4 (1024 bytes)
688 	   low-water mark  to RX_FIFO_SIZE / 8 (512 bytes)
689 	 */
690 	r = emac_calc_rwmr(dev, rx_size / 8 / dev->fifo_entry_size,
691 			   rx_size / 4 / dev->fifo_entry_size);
692 	out_be32(&p->rwmr, r);
693 
694 	/* Set PAUSE timer to the maximum */
695 	out_be32(&p->ptr, 0xffff);
696 
697 	/* IRQ sources */
698 	r = EMAC_ISR_OVR | EMAC_ISR_BP | EMAC_ISR_SE |
699 		EMAC_ISR_ALE | EMAC_ISR_BFCS | EMAC_ISR_PTLE | EMAC_ISR_ORE |
700 		EMAC_ISR_IRE | EMAC_ISR_TE;
701 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
702 	    r |= EMAC4_ISR_TXPE | EMAC4_ISR_RXPE /* | EMAC4_ISR_TXUE |
703 						  EMAC4_ISR_RXOE | */;
704 	out_be32(&p->iser,  r);
705 
706 	/* We need to take GPCS PHY out of isolate mode after EMAC reset */
707 	if (emac_phy_gpcs(dev->phy.mode)) {
708 		if (dev->phy.gpcs_address != 0xffffffff)
709 			emac_mii_reset_gpcs(&dev->phy);
710 		else
711 			emac_mii_reset_phy(&dev->phy);
712 	}
713 
714 	return 0;
715 }
716 
717 static void emac_reinitialize(struct emac_instance *dev)
718 {
719 	DBG(dev, "reinitialize" NL);
720 
721 	emac_netif_stop(dev);
722 	if (!emac_configure(dev)) {
723 		emac_tx_enable(dev);
724 		emac_rx_enable(dev);
725 	}
726 	emac_netif_start(dev);
727 }
728 
729 static void emac_full_tx_reset(struct emac_instance *dev)
730 {
731 	DBG(dev, "full_tx_reset" NL);
732 
733 	emac_tx_disable(dev);
734 	mal_disable_tx_channel(dev->mal, dev->mal_tx_chan);
735 	emac_clean_tx_ring(dev);
736 	dev->tx_cnt = dev->tx_slot = dev->ack_slot = 0;
737 
738 	emac_configure(dev);
739 
740 	mal_enable_tx_channel(dev->mal, dev->mal_tx_chan);
741 	emac_tx_enable(dev);
742 	emac_rx_enable(dev);
743 }
744 
745 static void emac_reset_work(struct work_struct *work)
746 {
747 	struct emac_instance *dev = container_of(work, struct emac_instance, reset_work);
748 
749 	DBG(dev, "reset_work" NL);
750 
751 	mutex_lock(&dev->link_lock);
752 	if (dev->opened) {
753 		emac_netif_stop(dev);
754 		emac_full_tx_reset(dev);
755 		emac_netif_start(dev);
756 	}
757 	mutex_unlock(&dev->link_lock);
758 }
759 
760 static void emac_tx_timeout(struct net_device *ndev)
761 {
762 	struct emac_instance *dev = netdev_priv(ndev);
763 
764 	DBG(dev, "tx_timeout" NL);
765 
766 	schedule_work(&dev->reset_work);
767 }
768 
769 
770 static inline int emac_phy_done(struct emac_instance *dev, u32 stacr)
771 {
772 	int done = !!(stacr & EMAC_STACR_OC);
773 
774 	if (emac_has_feature(dev, EMAC_FTR_STACR_OC_INVERT))
775 		done = !done;
776 
777 	return done;
778 };
779 
780 static int __emac_mdio_read(struct emac_instance *dev, u8 id, u8 reg)
781 {
782 	struct emac_regs __iomem *p = dev->emacp;
783 	u32 r = 0;
784 	int n, err = -ETIMEDOUT;
785 
786 	mutex_lock(&dev->mdio_lock);
787 
788 	DBG2(dev, "mdio_read(%02x,%02x)" NL, id, reg);
789 
790 	/* Enable proper MDIO port */
791 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
792 		zmii_get_mdio(dev->zmii_dev, dev->zmii_port);
793 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
794 		rgmii_get_mdio(dev->rgmii_dev, dev->rgmii_port);
795 
796 	/* Wait for management interface to become idle */
797 	n = 20;
798 	while (!emac_phy_done(dev, in_be32(&p->stacr))) {
799 		udelay(1);
800 		if (!--n) {
801 			DBG2(dev, " -> timeout wait idle\n");
802 			goto bail;
803 		}
804 	}
805 
806 	/* Issue read command */
807 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
808 		r = EMAC4_STACR_BASE(dev->opb_bus_freq);
809 	else
810 		r = EMAC_STACR_BASE(dev->opb_bus_freq);
811 	if (emac_has_feature(dev, EMAC_FTR_STACR_OC_INVERT))
812 		r |= EMAC_STACR_OC;
813 	if (emac_has_feature(dev, EMAC_FTR_HAS_NEW_STACR))
814 		r |= EMACX_STACR_STAC_READ;
815 	else
816 		r |= EMAC_STACR_STAC_READ;
817 	r |= (reg & EMAC_STACR_PRA_MASK)
818 		| ((id & EMAC_STACR_PCDA_MASK) << EMAC_STACR_PCDA_SHIFT);
819 	out_be32(&p->stacr, r);
820 
821 	/* Wait for read to complete */
822 	n = 200;
823 	while (!emac_phy_done(dev, (r = in_be32(&p->stacr)))) {
824 		udelay(1);
825 		if (!--n) {
826 			DBG2(dev, " -> timeout wait complete\n");
827 			goto bail;
828 		}
829 	}
830 
831 	if (unlikely(r & EMAC_STACR_PHYE)) {
832 		DBG(dev, "mdio_read(%02x, %02x) failed" NL, id, reg);
833 		err = -EREMOTEIO;
834 		goto bail;
835 	}
836 
837 	r = ((r >> EMAC_STACR_PHYD_SHIFT) & EMAC_STACR_PHYD_MASK);
838 
839 	DBG2(dev, "mdio_read -> %04x" NL, r);
840 	err = 0;
841  bail:
842 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
843 		rgmii_put_mdio(dev->rgmii_dev, dev->rgmii_port);
844 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
845 		zmii_put_mdio(dev->zmii_dev, dev->zmii_port);
846 	mutex_unlock(&dev->mdio_lock);
847 
848 	return err == 0 ? r : err;
849 }
850 
851 static void __emac_mdio_write(struct emac_instance *dev, u8 id, u8 reg,
852 			      u16 val)
853 {
854 	struct emac_regs __iomem *p = dev->emacp;
855 	u32 r = 0;
856 	int n, err = -ETIMEDOUT;
857 
858 	mutex_lock(&dev->mdio_lock);
859 
860 	DBG2(dev, "mdio_write(%02x,%02x,%04x)" NL, id, reg, val);
861 
862 	/* Enable proper MDIO port */
863 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
864 		zmii_get_mdio(dev->zmii_dev, dev->zmii_port);
865 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
866 		rgmii_get_mdio(dev->rgmii_dev, dev->rgmii_port);
867 
868 	/* Wait for management interface to be idle */
869 	n = 20;
870 	while (!emac_phy_done(dev, in_be32(&p->stacr))) {
871 		udelay(1);
872 		if (!--n) {
873 			DBG2(dev, " -> timeout wait idle\n");
874 			goto bail;
875 		}
876 	}
877 
878 	/* Issue write command */
879 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
880 		r = EMAC4_STACR_BASE(dev->opb_bus_freq);
881 	else
882 		r = EMAC_STACR_BASE(dev->opb_bus_freq);
883 	if (emac_has_feature(dev, EMAC_FTR_STACR_OC_INVERT))
884 		r |= EMAC_STACR_OC;
885 	if (emac_has_feature(dev, EMAC_FTR_HAS_NEW_STACR))
886 		r |= EMACX_STACR_STAC_WRITE;
887 	else
888 		r |= EMAC_STACR_STAC_WRITE;
889 	r |= (reg & EMAC_STACR_PRA_MASK) |
890 		((id & EMAC_STACR_PCDA_MASK) << EMAC_STACR_PCDA_SHIFT) |
891 		(val << EMAC_STACR_PHYD_SHIFT);
892 	out_be32(&p->stacr, r);
893 
894 	/* Wait for write to complete */
895 	n = 200;
896 	while (!emac_phy_done(dev, in_be32(&p->stacr))) {
897 		udelay(1);
898 		if (!--n) {
899 			DBG2(dev, " -> timeout wait complete\n");
900 			goto bail;
901 		}
902 	}
903 	err = 0;
904  bail:
905 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
906 		rgmii_put_mdio(dev->rgmii_dev, dev->rgmii_port);
907 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
908 		zmii_put_mdio(dev->zmii_dev, dev->zmii_port);
909 	mutex_unlock(&dev->mdio_lock);
910 }
911 
912 static int emac_mdio_read(struct net_device *ndev, int id, int reg)
913 {
914 	struct emac_instance *dev = netdev_priv(ndev);
915 	int res;
916 
917 	res = __emac_mdio_read((dev->mdio_instance &&
918 				dev->phy.gpcs_address != id) ?
919 				dev->mdio_instance : dev,
920 			       (u8) id, (u8) reg);
921 	return res;
922 }
923 
924 static void emac_mdio_write(struct net_device *ndev, int id, int reg, int val)
925 {
926 	struct emac_instance *dev = netdev_priv(ndev);
927 
928 	__emac_mdio_write((dev->mdio_instance &&
929 			   dev->phy.gpcs_address != id) ?
930 			   dev->mdio_instance : dev,
931 			  (u8) id, (u8) reg, (u16) val);
932 }
933 
934 /* Tx lock BH */
935 static void __emac_set_multicast_list(struct emac_instance *dev)
936 {
937 	struct emac_regs __iomem *p = dev->emacp;
938 	u32 rmr = emac_iff2rmr(dev->ndev);
939 
940 	DBG(dev, "__multicast %08x" NL, rmr);
941 
942 	/* I decided to relax register access rules here to avoid
943 	 * full EMAC reset.
944 	 *
945 	 * There is a real problem with EMAC4 core if we use MWSW_001 bit
946 	 * in MR1 register and do a full EMAC reset.
947 	 * One TX BD status update is delayed and, after EMAC reset, it
948 	 * never happens, resulting in TX hung (it'll be recovered by TX
949 	 * timeout handler eventually, but this is just gross).
950 	 * So we either have to do full TX reset or try to cheat here :)
951 	 *
952 	 * The only required change is to RX mode register, so I *think* all
953 	 * we need is just to stop RX channel. This seems to work on all
954 	 * tested SoCs.                                                --ebs
955 	 *
956 	 * If we need the full reset, we might just trigger the workqueue
957 	 * and do it async... a bit nasty but should work --BenH
958 	 */
959 	dev->mcast_pending = 0;
960 	emac_rx_disable(dev);
961 	if (rmr & EMAC_RMR_MAE)
962 		emac_hash_mc(dev);
963 	out_be32(&p->rmr, rmr);
964 	emac_rx_enable(dev);
965 }
966 
967 /* Tx lock BH */
968 static void emac_set_multicast_list(struct net_device *ndev)
969 {
970 	struct emac_instance *dev = netdev_priv(ndev);
971 
972 	DBG(dev, "multicast" NL);
973 
974 	BUG_ON(!netif_running(dev->ndev));
975 
976 	if (dev->no_mcast) {
977 		dev->mcast_pending = 1;
978 		return;
979 	}
980 	__emac_set_multicast_list(dev);
981 }
982 
983 static int emac_resize_rx_ring(struct emac_instance *dev, int new_mtu)
984 {
985 	int rx_sync_size = emac_rx_sync_size(new_mtu);
986 	int rx_skb_size = emac_rx_skb_size(new_mtu);
987 	int i, ret = 0;
988 	int mr1_jumbo_bit_change = 0;
989 
990 	mutex_lock(&dev->link_lock);
991 	emac_netif_stop(dev);
992 	emac_rx_disable(dev);
993 	mal_disable_rx_channel(dev->mal, dev->mal_rx_chan);
994 
995 	if (dev->rx_sg_skb) {
996 		++dev->estats.rx_dropped_resize;
997 		dev_kfree_skb(dev->rx_sg_skb);
998 		dev->rx_sg_skb = NULL;
999 	}
1000 
1001 	/* Make a first pass over RX ring and mark BDs ready, dropping
1002 	 * non-processed packets on the way. We need this as a separate pass
1003 	 * to simplify error recovery in the case of allocation failure later.
1004 	 */
1005 	for (i = 0; i < NUM_RX_BUFF; ++i) {
1006 		if (dev->rx_desc[i].ctrl & MAL_RX_CTRL_FIRST)
1007 			++dev->estats.rx_dropped_resize;
1008 
1009 		dev->rx_desc[i].data_len = 0;
1010 		dev->rx_desc[i].ctrl = MAL_RX_CTRL_EMPTY |
1011 		    (i == (NUM_RX_BUFF - 1) ? MAL_RX_CTRL_WRAP : 0);
1012 	}
1013 
1014 	/* Reallocate RX ring only if bigger skb buffers are required */
1015 	if (rx_skb_size <= dev->rx_skb_size)
1016 		goto skip;
1017 
1018 	/* Second pass, allocate new skbs */
1019 	for (i = 0; i < NUM_RX_BUFF; ++i) {
1020 		struct sk_buff *skb = alloc_skb(rx_skb_size, GFP_ATOMIC);
1021 		if (!skb) {
1022 			ret = -ENOMEM;
1023 			goto oom;
1024 		}
1025 
1026 		BUG_ON(!dev->rx_skb[i]);
1027 		dev_kfree_skb(dev->rx_skb[i]);
1028 
1029 		skb_reserve(skb, EMAC_RX_SKB_HEADROOM + 2);
1030 		dev->rx_desc[i].data_ptr =
1031 		    dma_map_single(&dev->ofdev->dev, skb->data - 2, rx_sync_size,
1032 				   DMA_FROM_DEVICE) + 2;
1033 		dev->rx_skb[i] = skb;
1034 	}
1035  skip:
1036 	/* Check if we need to change "Jumbo" bit in MR1 */
1037 	if (emac_has_feature(dev, EMAC_APM821XX_REQ_JUMBO_FRAME_SIZE)) {
1038 		mr1_jumbo_bit_change = (new_mtu > ETH_DATA_LEN) ||
1039 				(dev->ndev->mtu > ETH_DATA_LEN);
1040 	} else {
1041 		mr1_jumbo_bit_change = (new_mtu > ETH_DATA_LEN) ^
1042 				(dev->ndev->mtu > ETH_DATA_LEN);
1043 	}
1044 
1045 	if (mr1_jumbo_bit_change) {
1046 		/* This is to prevent starting RX channel in emac_rx_enable() */
1047 		set_bit(MAL_COMMAC_RX_STOPPED, &dev->commac.flags);
1048 
1049 		dev->ndev->mtu = new_mtu;
1050 		emac_full_tx_reset(dev);
1051 	}
1052 
1053 	mal_set_rcbs(dev->mal, dev->mal_rx_chan, emac_rx_size(new_mtu));
1054  oom:
1055 	/* Restart RX */
1056 	clear_bit(MAL_COMMAC_RX_STOPPED, &dev->commac.flags);
1057 	dev->rx_slot = 0;
1058 	mal_enable_rx_channel(dev->mal, dev->mal_rx_chan);
1059 	emac_rx_enable(dev);
1060 	emac_netif_start(dev);
1061 	mutex_unlock(&dev->link_lock);
1062 
1063 	return ret;
1064 }
1065 
1066 /* Process ctx, rtnl_lock semaphore */
1067 static int emac_change_mtu(struct net_device *ndev, int new_mtu)
1068 {
1069 	struct emac_instance *dev = netdev_priv(ndev);
1070 	int ret = 0;
1071 
1072 	if (new_mtu < EMAC_MIN_MTU || new_mtu > dev->max_mtu)
1073 		return -EINVAL;
1074 
1075 	DBG(dev, "change_mtu(%d)" NL, new_mtu);
1076 
1077 	if (netif_running(ndev)) {
1078 		/* Check if we really need to reinitialize RX ring */
1079 		if (emac_rx_skb_size(ndev->mtu) != emac_rx_skb_size(new_mtu))
1080 			ret = emac_resize_rx_ring(dev, new_mtu);
1081 	}
1082 
1083 	if (!ret) {
1084 		ndev->mtu = new_mtu;
1085 		dev->rx_skb_size = emac_rx_skb_size(new_mtu);
1086 		dev->rx_sync_size = emac_rx_sync_size(new_mtu);
1087 	}
1088 
1089 	return ret;
1090 }
1091 
1092 static void emac_clean_tx_ring(struct emac_instance *dev)
1093 {
1094 	int i;
1095 
1096 	for (i = 0; i < NUM_TX_BUFF; ++i) {
1097 		if (dev->tx_skb[i]) {
1098 			dev_kfree_skb(dev->tx_skb[i]);
1099 			dev->tx_skb[i] = NULL;
1100 			if (dev->tx_desc[i].ctrl & MAL_TX_CTRL_READY)
1101 				++dev->estats.tx_dropped;
1102 		}
1103 		dev->tx_desc[i].ctrl = 0;
1104 		dev->tx_desc[i].data_ptr = 0;
1105 	}
1106 }
1107 
1108 static void emac_clean_rx_ring(struct emac_instance *dev)
1109 {
1110 	int i;
1111 
1112 	for (i = 0; i < NUM_RX_BUFF; ++i)
1113 		if (dev->rx_skb[i]) {
1114 			dev->rx_desc[i].ctrl = 0;
1115 			dev_kfree_skb(dev->rx_skb[i]);
1116 			dev->rx_skb[i] = NULL;
1117 			dev->rx_desc[i].data_ptr = 0;
1118 		}
1119 
1120 	if (dev->rx_sg_skb) {
1121 		dev_kfree_skb(dev->rx_sg_skb);
1122 		dev->rx_sg_skb = NULL;
1123 	}
1124 }
1125 
1126 static inline int emac_alloc_rx_skb(struct emac_instance *dev, int slot,
1127 				    gfp_t flags)
1128 {
1129 	struct sk_buff *skb = alloc_skb(dev->rx_skb_size, flags);
1130 	if (unlikely(!skb))
1131 		return -ENOMEM;
1132 
1133 	dev->rx_skb[slot] = skb;
1134 	dev->rx_desc[slot].data_len = 0;
1135 
1136 	skb_reserve(skb, EMAC_RX_SKB_HEADROOM + 2);
1137 	dev->rx_desc[slot].data_ptr =
1138 	    dma_map_single(&dev->ofdev->dev, skb->data - 2, dev->rx_sync_size,
1139 			   DMA_FROM_DEVICE) + 2;
1140 	wmb();
1141 	dev->rx_desc[slot].ctrl = MAL_RX_CTRL_EMPTY |
1142 	    (slot == (NUM_RX_BUFF - 1) ? MAL_RX_CTRL_WRAP : 0);
1143 
1144 	return 0;
1145 }
1146 
1147 static void emac_print_link_status(struct emac_instance *dev)
1148 {
1149 	if (netif_carrier_ok(dev->ndev))
1150 		printk(KERN_INFO "%s: link is up, %d %s%s\n",
1151 		       dev->ndev->name, dev->phy.speed,
1152 		       dev->phy.duplex == DUPLEX_FULL ? "FDX" : "HDX",
1153 		       dev->phy.pause ? ", pause enabled" :
1154 		       dev->phy.asym_pause ? ", asymmetric pause enabled" : "");
1155 	else
1156 		printk(KERN_INFO "%s: link is down\n", dev->ndev->name);
1157 }
1158 
1159 /* Process ctx, rtnl_lock semaphore */
1160 static int emac_open(struct net_device *ndev)
1161 {
1162 	struct emac_instance *dev = netdev_priv(ndev);
1163 	int err, i;
1164 
1165 	DBG(dev, "open" NL);
1166 
1167 	/* Setup error IRQ handler */
1168 	err = request_irq(dev->emac_irq, emac_irq, 0, "EMAC", dev);
1169 	if (err) {
1170 		printk(KERN_ERR "%s: failed to request IRQ %d\n",
1171 		       ndev->name, dev->emac_irq);
1172 		return err;
1173 	}
1174 
1175 	/* Allocate RX ring */
1176 	for (i = 0; i < NUM_RX_BUFF; ++i)
1177 		if (emac_alloc_rx_skb(dev, i, GFP_KERNEL)) {
1178 			printk(KERN_ERR "%s: failed to allocate RX ring\n",
1179 			       ndev->name);
1180 			goto oom;
1181 		}
1182 
1183 	dev->tx_cnt = dev->tx_slot = dev->ack_slot = dev->rx_slot = 0;
1184 	clear_bit(MAL_COMMAC_RX_STOPPED, &dev->commac.flags);
1185 	dev->rx_sg_skb = NULL;
1186 
1187 	mutex_lock(&dev->link_lock);
1188 	dev->opened = 1;
1189 
1190 	/* Start PHY polling now.
1191 	 */
1192 	if (dev->phy.address >= 0) {
1193 		int link_poll_interval;
1194 		if (dev->phy.def->ops->poll_link(&dev->phy)) {
1195 			dev->phy.def->ops->read_link(&dev->phy);
1196 			emac_rx_clk_default(dev);
1197 			netif_carrier_on(dev->ndev);
1198 			link_poll_interval = PHY_POLL_LINK_ON;
1199 		} else {
1200 			emac_rx_clk_tx(dev);
1201 			netif_carrier_off(dev->ndev);
1202 			link_poll_interval = PHY_POLL_LINK_OFF;
1203 		}
1204 		dev->link_polling = 1;
1205 		wmb();
1206 		schedule_delayed_work(&dev->link_work, link_poll_interval);
1207 		emac_print_link_status(dev);
1208 	} else
1209 		netif_carrier_on(dev->ndev);
1210 
1211 	/* Required for Pause packet support in EMAC */
1212 	dev_mc_add_global(ndev, default_mcast_addr);
1213 
1214 	emac_configure(dev);
1215 	mal_poll_add(dev->mal, &dev->commac);
1216 	mal_enable_tx_channel(dev->mal, dev->mal_tx_chan);
1217 	mal_set_rcbs(dev->mal, dev->mal_rx_chan, emac_rx_size(ndev->mtu));
1218 	mal_enable_rx_channel(dev->mal, dev->mal_rx_chan);
1219 	emac_tx_enable(dev);
1220 	emac_rx_enable(dev);
1221 	emac_netif_start(dev);
1222 
1223 	mutex_unlock(&dev->link_lock);
1224 
1225 	return 0;
1226  oom:
1227 	emac_clean_rx_ring(dev);
1228 	free_irq(dev->emac_irq, dev);
1229 
1230 	return -ENOMEM;
1231 }
1232 
1233 /* BHs disabled */
1234 #if 0
1235 static int emac_link_differs(struct emac_instance *dev)
1236 {
1237 	u32 r = in_be32(&dev->emacp->mr1);
1238 
1239 	int duplex = r & EMAC_MR1_FDE ? DUPLEX_FULL : DUPLEX_HALF;
1240 	int speed, pause, asym_pause;
1241 
1242 	if (r & EMAC_MR1_MF_1000)
1243 		speed = SPEED_1000;
1244 	else if (r & EMAC_MR1_MF_100)
1245 		speed = SPEED_100;
1246 	else
1247 		speed = SPEED_10;
1248 
1249 	switch (r & (EMAC_MR1_EIFC | EMAC_MR1_APP)) {
1250 	case (EMAC_MR1_EIFC | EMAC_MR1_APP):
1251 		pause = 1;
1252 		asym_pause = 0;
1253 		break;
1254 	case EMAC_MR1_APP:
1255 		pause = 0;
1256 		asym_pause = 1;
1257 		break;
1258 	default:
1259 		pause = asym_pause = 0;
1260 	}
1261 	return speed != dev->phy.speed || duplex != dev->phy.duplex ||
1262 	    pause != dev->phy.pause || asym_pause != dev->phy.asym_pause;
1263 }
1264 #endif
1265 
1266 static void emac_link_timer(struct work_struct *work)
1267 {
1268 	struct emac_instance *dev =
1269 		container_of(to_delayed_work(work),
1270 			     struct emac_instance, link_work);
1271 	int link_poll_interval;
1272 
1273 	mutex_lock(&dev->link_lock);
1274 	DBG2(dev, "link timer" NL);
1275 
1276 	if (!dev->opened)
1277 		goto bail;
1278 
1279 	if (dev->phy.def->ops->poll_link(&dev->phy)) {
1280 		if (!netif_carrier_ok(dev->ndev)) {
1281 			emac_rx_clk_default(dev);
1282 			/* Get new link parameters */
1283 			dev->phy.def->ops->read_link(&dev->phy);
1284 
1285 			netif_carrier_on(dev->ndev);
1286 			emac_netif_stop(dev);
1287 			emac_full_tx_reset(dev);
1288 			emac_netif_start(dev);
1289 			emac_print_link_status(dev);
1290 		}
1291 		link_poll_interval = PHY_POLL_LINK_ON;
1292 	} else {
1293 		if (netif_carrier_ok(dev->ndev)) {
1294 			emac_rx_clk_tx(dev);
1295 			netif_carrier_off(dev->ndev);
1296 			netif_tx_disable(dev->ndev);
1297 			emac_reinitialize(dev);
1298 			emac_print_link_status(dev);
1299 		}
1300 		link_poll_interval = PHY_POLL_LINK_OFF;
1301 	}
1302 	schedule_delayed_work(&dev->link_work, link_poll_interval);
1303  bail:
1304 	mutex_unlock(&dev->link_lock);
1305 }
1306 
1307 static void emac_force_link_update(struct emac_instance *dev)
1308 {
1309 	netif_carrier_off(dev->ndev);
1310 	smp_rmb();
1311 	if (dev->link_polling) {
1312 		cancel_delayed_work_sync(&dev->link_work);
1313 		if (dev->link_polling)
1314 			schedule_delayed_work(&dev->link_work,  PHY_POLL_LINK_OFF);
1315 	}
1316 }
1317 
1318 /* Process ctx, rtnl_lock semaphore */
1319 static int emac_close(struct net_device *ndev)
1320 {
1321 	struct emac_instance *dev = netdev_priv(ndev);
1322 
1323 	DBG(dev, "close" NL);
1324 
1325 	if (dev->phy.address >= 0) {
1326 		dev->link_polling = 0;
1327 		cancel_delayed_work_sync(&dev->link_work);
1328 	}
1329 	mutex_lock(&dev->link_lock);
1330 	emac_netif_stop(dev);
1331 	dev->opened = 0;
1332 	mutex_unlock(&dev->link_lock);
1333 
1334 	emac_rx_disable(dev);
1335 	emac_tx_disable(dev);
1336 	mal_disable_rx_channel(dev->mal, dev->mal_rx_chan);
1337 	mal_disable_tx_channel(dev->mal, dev->mal_tx_chan);
1338 	mal_poll_del(dev->mal, &dev->commac);
1339 
1340 	emac_clean_tx_ring(dev);
1341 	emac_clean_rx_ring(dev);
1342 
1343 	free_irq(dev->emac_irq, dev);
1344 
1345 	netif_carrier_off(ndev);
1346 
1347 	return 0;
1348 }
1349 
1350 static inline u16 emac_tx_csum(struct emac_instance *dev,
1351 			       struct sk_buff *skb)
1352 {
1353 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH) &&
1354 		(skb->ip_summed == CHECKSUM_PARTIAL)) {
1355 		++dev->stats.tx_packets_csum;
1356 		return EMAC_TX_CTRL_TAH_CSUM;
1357 	}
1358 	return 0;
1359 }
1360 
1361 static inline int emac_xmit_finish(struct emac_instance *dev, int len)
1362 {
1363 	struct emac_regs __iomem *p = dev->emacp;
1364 	struct net_device *ndev = dev->ndev;
1365 
1366 	/* Send the packet out. If the if makes a significant perf
1367 	 * difference, then we can store the TMR0 value in "dev"
1368 	 * instead
1369 	 */
1370 	if (emac_has_feature(dev, EMAC_FTR_EMAC4))
1371 		out_be32(&p->tmr0, EMAC4_TMR0_XMIT);
1372 	else
1373 		out_be32(&p->tmr0, EMAC_TMR0_XMIT);
1374 
1375 	if (unlikely(++dev->tx_cnt == NUM_TX_BUFF)) {
1376 		netif_stop_queue(ndev);
1377 		DBG2(dev, "stopped TX queue" NL);
1378 	}
1379 
1380 	ndev->trans_start = jiffies;
1381 	++dev->stats.tx_packets;
1382 	dev->stats.tx_bytes += len;
1383 
1384 	return NETDEV_TX_OK;
1385 }
1386 
1387 /* Tx lock BH */
1388 static int emac_start_xmit(struct sk_buff *skb, struct net_device *ndev)
1389 {
1390 	struct emac_instance *dev = netdev_priv(ndev);
1391 	unsigned int len = skb->len;
1392 	int slot;
1393 
1394 	u16 ctrl = EMAC_TX_CTRL_GFCS | EMAC_TX_CTRL_GP | MAL_TX_CTRL_READY |
1395 	    MAL_TX_CTRL_LAST | emac_tx_csum(dev, skb);
1396 
1397 	slot = dev->tx_slot++;
1398 	if (dev->tx_slot == NUM_TX_BUFF) {
1399 		dev->tx_slot = 0;
1400 		ctrl |= MAL_TX_CTRL_WRAP;
1401 	}
1402 
1403 	DBG2(dev, "xmit(%u) %d" NL, len, slot);
1404 
1405 	dev->tx_skb[slot] = skb;
1406 	dev->tx_desc[slot].data_ptr = dma_map_single(&dev->ofdev->dev,
1407 						     skb->data, len,
1408 						     DMA_TO_DEVICE);
1409 	dev->tx_desc[slot].data_len = (u16) len;
1410 	wmb();
1411 	dev->tx_desc[slot].ctrl = ctrl;
1412 
1413 	return emac_xmit_finish(dev, len);
1414 }
1415 
1416 static inline int emac_xmit_split(struct emac_instance *dev, int slot,
1417 				  u32 pd, int len, int last, u16 base_ctrl)
1418 {
1419 	while (1) {
1420 		u16 ctrl = base_ctrl;
1421 		int chunk = min(len, MAL_MAX_TX_SIZE);
1422 		len -= chunk;
1423 
1424 		slot = (slot + 1) % NUM_TX_BUFF;
1425 
1426 		if (last && !len)
1427 			ctrl |= MAL_TX_CTRL_LAST;
1428 		if (slot == NUM_TX_BUFF - 1)
1429 			ctrl |= MAL_TX_CTRL_WRAP;
1430 
1431 		dev->tx_skb[slot] = NULL;
1432 		dev->tx_desc[slot].data_ptr = pd;
1433 		dev->tx_desc[slot].data_len = (u16) chunk;
1434 		dev->tx_desc[slot].ctrl = ctrl;
1435 		++dev->tx_cnt;
1436 
1437 		if (!len)
1438 			break;
1439 
1440 		pd += chunk;
1441 	}
1442 	return slot;
1443 }
1444 
1445 /* Tx lock BH disabled (SG version for TAH equipped EMACs) */
1446 static int emac_start_xmit_sg(struct sk_buff *skb, struct net_device *ndev)
1447 {
1448 	struct emac_instance *dev = netdev_priv(ndev);
1449 	int nr_frags = skb_shinfo(skb)->nr_frags;
1450 	int len = skb->len, chunk;
1451 	int slot, i;
1452 	u16 ctrl;
1453 	u32 pd;
1454 
1455 	/* This is common "fast" path */
1456 	if (likely(!nr_frags && len <= MAL_MAX_TX_SIZE))
1457 		return emac_start_xmit(skb, ndev);
1458 
1459 	len -= skb->data_len;
1460 
1461 	/* Note, this is only an *estimation*, we can still run out of empty
1462 	 * slots because of the additional fragmentation into
1463 	 * MAL_MAX_TX_SIZE-sized chunks
1464 	 */
1465 	if (unlikely(dev->tx_cnt + nr_frags + mal_tx_chunks(len) > NUM_TX_BUFF))
1466 		goto stop_queue;
1467 
1468 	ctrl = EMAC_TX_CTRL_GFCS | EMAC_TX_CTRL_GP | MAL_TX_CTRL_READY |
1469 	    emac_tx_csum(dev, skb);
1470 	slot = dev->tx_slot;
1471 
1472 	/* skb data */
1473 	dev->tx_skb[slot] = NULL;
1474 	chunk = min(len, MAL_MAX_TX_SIZE);
1475 	dev->tx_desc[slot].data_ptr = pd =
1476 	    dma_map_single(&dev->ofdev->dev, skb->data, len, DMA_TO_DEVICE);
1477 	dev->tx_desc[slot].data_len = (u16) chunk;
1478 	len -= chunk;
1479 	if (unlikely(len))
1480 		slot = emac_xmit_split(dev, slot, pd + chunk, len, !nr_frags,
1481 				       ctrl);
1482 	/* skb fragments */
1483 	for (i = 0; i < nr_frags; ++i) {
1484 		struct skb_frag_struct *frag = &skb_shinfo(skb)->frags[i];
1485 		len = skb_frag_size(frag);
1486 
1487 		if (unlikely(dev->tx_cnt + mal_tx_chunks(len) >= NUM_TX_BUFF))
1488 			goto undo_frame;
1489 
1490 		pd = skb_frag_dma_map(&dev->ofdev->dev, frag, 0, len,
1491 				      DMA_TO_DEVICE);
1492 
1493 		slot = emac_xmit_split(dev, slot, pd, len, i == nr_frags - 1,
1494 				       ctrl);
1495 	}
1496 
1497 	DBG2(dev, "xmit_sg(%u) %d - %d" NL, skb->len, dev->tx_slot, slot);
1498 
1499 	/* Attach skb to the last slot so we don't release it too early */
1500 	dev->tx_skb[slot] = skb;
1501 
1502 	/* Send the packet out */
1503 	if (dev->tx_slot == NUM_TX_BUFF - 1)
1504 		ctrl |= MAL_TX_CTRL_WRAP;
1505 	wmb();
1506 	dev->tx_desc[dev->tx_slot].ctrl = ctrl;
1507 	dev->tx_slot = (slot + 1) % NUM_TX_BUFF;
1508 
1509 	return emac_xmit_finish(dev, skb->len);
1510 
1511  undo_frame:
1512 	/* Well, too bad. Our previous estimation was overly optimistic.
1513 	 * Undo everything.
1514 	 */
1515 	while (slot != dev->tx_slot) {
1516 		dev->tx_desc[slot].ctrl = 0;
1517 		--dev->tx_cnt;
1518 		if (--slot < 0)
1519 			slot = NUM_TX_BUFF - 1;
1520 	}
1521 	++dev->estats.tx_undo;
1522 
1523  stop_queue:
1524 	netif_stop_queue(ndev);
1525 	DBG2(dev, "stopped TX queue" NL);
1526 	return NETDEV_TX_BUSY;
1527 }
1528 
1529 /* Tx lock BHs */
1530 static void emac_parse_tx_error(struct emac_instance *dev, u16 ctrl)
1531 {
1532 	struct emac_error_stats *st = &dev->estats;
1533 
1534 	DBG(dev, "BD TX error %04x" NL, ctrl);
1535 
1536 	++st->tx_bd_errors;
1537 	if (ctrl & EMAC_TX_ST_BFCS)
1538 		++st->tx_bd_bad_fcs;
1539 	if (ctrl & EMAC_TX_ST_LCS)
1540 		++st->tx_bd_carrier_loss;
1541 	if (ctrl & EMAC_TX_ST_ED)
1542 		++st->tx_bd_excessive_deferral;
1543 	if (ctrl & EMAC_TX_ST_EC)
1544 		++st->tx_bd_excessive_collisions;
1545 	if (ctrl & EMAC_TX_ST_LC)
1546 		++st->tx_bd_late_collision;
1547 	if (ctrl & EMAC_TX_ST_MC)
1548 		++st->tx_bd_multple_collisions;
1549 	if (ctrl & EMAC_TX_ST_SC)
1550 		++st->tx_bd_single_collision;
1551 	if (ctrl & EMAC_TX_ST_UR)
1552 		++st->tx_bd_underrun;
1553 	if (ctrl & EMAC_TX_ST_SQE)
1554 		++st->tx_bd_sqe;
1555 }
1556 
1557 static void emac_poll_tx(void *param)
1558 {
1559 	struct emac_instance *dev = param;
1560 	u32 bad_mask;
1561 
1562 	DBG2(dev, "poll_tx, %d %d" NL, dev->tx_cnt, dev->ack_slot);
1563 
1564 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH))
1565 		bad_mask = EMAC_IS_BAD_TX_TAH;
1566 	else
1567 		bad_mask = EMAC_IS_BAD_TX;
1568 
1569 	netif_tx_lock_bh(dev->ndev);
1570 	if (dev->tx_cnt) {
1571 		u16 ctrl;
1572 		int slot = dev->ack_slot, n = 0;
1573 	again:
1574 		ctrl = dev->tx_desc[slot].ctrl;
1575 		if (!(ctrl & MAL_TX_CTRL_READY)) {
1576 			struct sk_buff *skb = dev->tx_skb[slot];
1577 			++n;
1578 
1579 			if (skb) {
1580 				dev_kfree_skb(skb);
1581 				dev->tx_skb[slot] = NULL;
1582 			}
1583 			slot = (slot + 1) % NUM_TX_BUFF;
1584 
1585 			if (unlikely(ctrl & bad_mask))
1586 				emac_parse_tx_error(dev, ctrl);
1587 
1588 			if (--dev->tx_cnt)
1589 				goto again;
1590 		}
1591 		if (n) {
1592 			dev->ack_slot = slot;
1593 			if (netif_queue_stopped(dev->ndev) &&
1594 			    dev->tx_cnt < EMAC_TX_WAKEUP_THRESH)
1595 				netif_wake_queue(dev->ndev);
1596 
1597 			DBG2(dev, "tx %d pkts" NL, n);
1598 		}
1599 	}
1600 	netif_tx_unlock_bh(dev->ndev);
1601 }
1602 
1603 static inline void emac_recycle_rx_skb(struct emac_instance *dev, int slot,
1604 				       int len)
1605 {
1606 	struct sk_buff *skb = dev->rx_skb[slot];
1607 
1608 	DBG2(dev, "recycle %d %d" NL, slot, len);
1609 
1610 	if (len)
1611 		dma_map_single(&dev->ofdev->dev, skb->data - 2,
1612 			       EMAC_DMA_ALIGN(len + 2), DMA_FROM_DEVICE);
1613 
1614 	dev->rx_desc[slot].data_len = 0;
1615 	wmb();
1616 	dev->rx_desc[slot].ctrl = MAL_RX_CTRL_EMPTY |
1617 	    (slot == (NUM_RX_BUFF - 1) ? MAL_RX_CTRL_WRAP : 0);
1618 }
1619 
1620 static void emac_parse_rx_error(struct emac_instance *dev, u16 ctrl)
1621 {
1622 	struct emac_error_stats *st = &dev->estats;
1623 
1624 	DBG(dev, "BD RX error %04x" NL, ctrl);
1625 
1626 	++st->rx_bd_errors;
1627 	if (ctrl & EMAC_RX_ST_OE)
1628 		++st->rx_bd_overrun;
1629 	if (ctrl & EMAC_RX_ST_BP)
1630 		++st->rx_bd_bad_packet;
1631 	if (ctrl & EMAC_RX_ST_RP)
1632 		++st->rx_bd_runt_packet;
1633 	if (ctrl & EMAC_RX_ST_SE)
1634 		++st->rx_bd_short_event;
1635 	if (ctrl & EMAC_RX_ST_AE)
1636 		++st->rx_bd_alignment_error;
1637 	if (ctrl & EMAC_RX_ST_BFCS)
1638 		++st->rx_bd_bad_fcs;
1639 	if (ctrl & EMAC_RX_ST_PTL)
1640 		++st->rx_bd_packet_too_long;
1641 	if (ctrl & EMAC_RX_ST_ORE)
1642 		++st->rx_bd_out_of_range;
1643 	if (ctrl & EMAC_RX_ST_IRE)
1644 		++st->rx_bd_in_range;
1645 }
1646 
1647 static inline void emac_rx_csum(struct emac_instance *dev,
1648 				struct sk_buff *skb, u16 ctrl)
1649 {
1650 #ifdef CONFIG_IBM_EMAC_TAH
1651 	if (!ctrl && dev->tah_dev) {
1652 		skb->ip_summed = CHECKSUM_UNNECESSARY;
1653 		++dev->stats.rx_packets_csum;
1654 	}
1655 #endif
1656 }
1657 
1658 static inline int emac_rx_sg_append(struct emac_instance *dev, int slot)
1659 {
1660 	if (likely(dev->rx_sg_skb != NULL)) {
1661 		int len = dev->rx_desc[slot].data_len;
1662 		int tot_len = dev->rx_sg_skb->len + len;
1663 
1664 		if (unlikely(tot_len + 2 > dev->rx_skb_size)) {
1665 			++dev->estats.rx_dropped_mtu;
1666 			dev_kfree_skb(dev->rx_sg_skb);
1667 			dev->rx_sg_skb = NULL;
1668 		} else {
1669 			memcpy(skb_tail_pointer(dev->rx_sg_skb),
1670 					 dev->rx_skb[slot]->data, len);
1671 			skb_put(dev->rx_sg_skb, len);
1672 			emac_recycle_rx_skb(dev, slot, len);
1673 			return 0;
1674 		}
1675 	}
1676 	emac_recycle_rx_skb(dev, slot, 0);
1677 	return -1;
1678 }
1679 
1680 /* NAPI poll context */
1681 static int emac_poll_rx(void *param, int budget)
1682 {
1683 	struct emac_instance *dev = param;
1684 	int slot = dev->rx_slot, received = 0;
1685 
1686 	DBG2(dev, "poll_rx(%d)" NL, budget);
1687 
1688  again:
1689 	while (budget > 0) {
1690 		int len;
1691 		struct sk_buff *skb;
1692 		u16 ctrl = dev->rx_desc[slot].ctrl;
1693 
1694 		if (ctrl & MAL_RX_CTRL_EMPTY)
1695 			break;
1696 
1697 		skb = dev->rx_skb[slot];
1698 		mb();
1699 		len = dev->rx_desc[slot].data_len;
1700 
1701 		if (unlikely(!MAL_IS_SINGLE_RX(ctrl)))
1702 			goto sg;
1703 
1704 		ctrl &= EMAC_BAD_RX_MASK;
1705 		if (unlikely(ctrl && ctrl != EMAC_RX_TAH_BAD_CSUM)) {
1706 			emac_parse_rx_error(dev, ctrl);
1707 			++dev->estats.rx_dropped_error;
1708 			emac_recycle_rx_skb(dev, slot, 0);
1709 			len = 0;
1710 			goto next;
1711 		}
1712 
1713 		if (len < ETH_HLEN) {
1714 			++dev->estats.rx_dropped_stack;
1715 			emac_recycle_rx_skb(dev, slot, len);
1716 			goto next;
1717 		}
1718 
1719 		if (len && len < EMAC_RX_COPY_THRESH) {
1720 			struct sk_buff *copy_skb =
1721 			    alloc_skb(len + EMAC_RX_SKB_HEADROOM + 2, GFP_ATOMIC);
1722 			if (unlikely(!copy_skb))
1723 				goto oom;
1724 
1725 			skb_reserve(copy_skb, EMAC_RX_SKB_HEADROOM + 2);
1726 			memcpy(copy_skb->data - 2, skb->data - 2, len + 2);
1727 			emac_recycle_rx_skb(dev, slot, len);
1728 			skb = copy_skb;
1729 		} else if (unlikely(emac_alloc_rx_skb(dev, slot, GFP_ATOMIC)))
1730 			goto oom;
1731 
1732 		skb_put(skb, len);
1733 	push_packet:
1734 		skb->protocol = eth_type_trans(skb, dev->ndev);
1735 		emac_rx_csum(dev, skb, ctrl);
1736 
1737 		if (unlikely(netif_receive_skb(skb) == NET_RX_DROP))
1738 			++dev->estats.rx_dropped_stack;
1739 	next:
1740 		++dev->stats.rx_packets;
1741 	skip:
1742 		dev->stats.rx_bytes += len;
1743 		slot = (slot + 1) % NUM_RX_BUFF;
1744 		--budget;
1745 		++received;
1746 		continue;
1747 	sg:
1748 		if (ctrl & MAL_RX_CTRL_FIRST) {
1749 			BUG_ON(dev->rx_sg_skb);
1750 			if (unlikely(emac_alloc_rx_skb(dev, slot, GFP_ATOMIC))) {
1751 				DBG(dev, "rx OOM %d" NL, slot);
1752 				++dev->estats.rx_dropped_oom;
1753 				emac_recycle_rx_skb(dev, slot, 0);
1754 			} else {
1755 				dev->rx_sg_skb = skb;
1756 				skb_put(skb, len);
1757 			}
1758 		} else if (!emac_rx_sg_append(dev, slot) &&
1759 			   (ctrl & MAL_RX_CTRL_LAST)) {
1760 
1761 			skb = dev->rx_sg_skb;
1762 			dev->rx_sg_skb = NULL;
1763 
1764 			ctrl &= EMAC_BAD_RX_MASK;
1765 			if (unlikely(ctrl && ctrl != EMAC_RX_TAH_BAD_CSUM)) {
1766 				emac_parse_rx_error(dev, ctrl);
1767 				++dev->estats.rx_dropped_error;
1768 				dev_kfree_skb(skb);
1769 				len = 0;
1770 			} else
1771 				goto push_packet;
1772 		}
1773 		goto skip;
1774 	oom:
1775 		DBG(dev, "rx OOM %d" NL, slot);
1776 		/* Drop the packet and recycle skb */
1777 		++dev->estats.rx_dropped_oom;
1778 		emac_recycle_rx_skb(dev, slot, 0);
1779 		goto next;
1780 	}
1781 
1782 	if (received) {
1783 		DBG2(dev, "rx %d BDs" NL, received);
1784 		dev->rx_slot = slot;
1785 	}
1786 
1787 	if (unlikely(budget && test_bit(MAL_COMMAC_RX_STOPPED, &dev->commac.flags))) {
1788 		mb();
1789 		if (!(dev->rx_desc[slot].ctrl & MAL_RX_CTRL_EMPTY)) {
1790 			DBG2(dev, "rx restart" NL);
1791 			received = 0;
1792 			goto again;
1793 		}
1794 
1795 		if (dev->rx_sg_skb) {
1796 			DBG2(dev, "dropping partial rx packet" NL);
1797 			++dev->estats.rx_dropped_error;
1798 			dev_kfree_skb(dev->rx_sg_skb);
1799 			dev->rx_sg_skb = NULL;
1800 		}
1801 
1802 		clear_bit(MAL_COMMAC_RX_STOPPED, &dev->commac.flags);
1803 		mal_enable_rx_channel(dev->mal, dev->mal_rx_chan);
1804 		emac_rx_enable(dev);
1805 		dev->rx_slot = 0;
1806 	}
1807 	return received;
1808 }
1809 
1810 /* NAPI poll context */
1811 static int emac_peek_rx(void *param)
1812 {
1813 	struct emac_instance *dev = param;
1814 
1815 	return !(dev->rx_desc[dev->rx_slot].ctrl & MAL_RX_CTRL_EMPTY);
1816 }
1817 
1818 /* NAPI poll context */
1819 static int emac_peek_rx_sg(void *param)
1820 {
1821 	struct emac_instance *dev = param;
1822 
1823 	int slot = dev->rx_slot;
1824 	while (1) {
1825 		u16 ctrl = dev->rx_desc[slot].ctrl;
1826 		if (ctrl & MAL_RX_CTRL_EMPTY)
1827 			return 0;
1828 		else if (ctrl & MAL_RX_CTRL_LAST)
1829 			return 1;
1830 
1831 		slot = (slot + 1) % NUM_RX_BUFF;
1832 
1833 		/* I'm just being paranoid here :) */
1834 		if (unlikely(slot == dev->rx_slot))
1835 			return 0;
1836 	}
1837 }
1838 
1839 /* Hard IRQ */
1840 static void emac_rxde(void *param)
1841 {
1842 	struct emac_instance *dev = param;
1843 
1844 	++dev->estats.rx_stopped;
1845 	emac_rx_disable_async(dev);
1846 }
1847 
1848 /* Hard IRQ */
1849 static irqreturn_t emac_irq(int irq, void *dev_instance)
1850 {
1851 	struct emac_instance *dev = dev_instance;
1852 	struct emac_regs __iomem *p = dev->emacp;
1853 	struct emac_error_stats *st = &dev->estats;
1854 	u32 isr;
1855 
1856 	spin_lock(&dev->lock);
1857 
1858 	isr = in_be32(&p->isr);
1859 	out_be32(&p->isr, isr);
1860 
1861 	DBG(dev, "isr = %08x" NL, isr);
1862 
1863 	if (isr & EMAC4_ISR_TXPE)
1864 		++st->tx_parity;
1865 	if (isr & EMAC4_ISR_RXPE)
1866 		++st->rx_parity;
1867 	if (isr & EMAC4_ISR_TXUE)
1868 		++st->tx_underrun;
1869 	if (isr & EMAC4_ISR_RXOE)
1870 		++st->rx_fifo_overrun;
1871 	if (isr & EMAC_ISR_OVR)
1872 		++st->rx_overrun;
1873 	if (isr & EMAC_ISR_BP)
1874 		++st->rx_bad_packet;
1875 	if (isr & EMAC_ISR_RP)
1876 		++st->rx_runt_packet;
1877 	if (isr & EMAC_ISR_SE)
1878 		++st->rx_short_event;
1879 	if (isr & EMAC_ISR_ALE)
1880 		++st->rx_alignment_error;
1881 	if (isr & EMAC_ISR_BFCS)
1882 		++st->rx_bad_fcs;
1883 	if (isr & EMAC_ISR_PTLE)
1884 		++st->rx_packet_too_long;
1885 	if (isr & EMAC_ISR_ORE)
1886 		++st->rx_out_of_range;
1887 	if (isr & EMAC_ISR_IRE)
1888 		++st->rx_in_range;
1889 	if (isr & EMAC_ISR_SQE)
1890 		++st->tx_sqe;
1891 	if (isr & EMAC_ISR_TE)
1892 		++st->tx_errors;
1893 
1894 	spin_unlock(&dev->lock);
1895 
1896 	return IRQ_HANDLED;
1897 }
1898 
1899 static struct net_device_stats *emac_stats(struct net_device *ndev)
1900 {
1901 	struct emac_instance *dev = netdev_priv(ndev);
1902 	struct emac_stats *st = &dev->stats;
1903 	struct emac_error_stats *est = &dev->estats;
1904 	struct net_device_stats *nst = &dev->nstats;
1905 	unsigned long flags;
1906 
1907 	DBG2(dev, "stats" NL);
1908 
1909 	/* Compute "legacy" statistics */
1910 	spin_lock_irqsave(&dev->lock, flags);
1911 	nst->rx_packets = (unsigned long)st->rx_packets;
1912 	nst->rx_bytes = (unsigned long)st->rx_bytes;
1913 	nst->tx_packets = (unsigned long)st->tx_packets;
1914 	nst->tx_bytes = (unsigned long)st->tx_bytes;
1915 	nst->rx_dropped = (unsigned long)(est->rx_dropped_oom +
1916 					  est->rx_dropped_error +
1917 					  est->rx_dropped_resize +
1918 					  est->rx_dropped_mtu);
1919 	nst->tx_dropped = (unsigned long)est->tx_dropped;
1920 
1921 	nst->rx_errors = (unsigned long)est->rx_bd_errors;
1922 	nst->rx_fifo_errors = (unsigned long)(est->rx_bd_overrun +
1923 					      est->rx_fifo_overrun +
1924 					      est->rx_overrun);
1925 	nst->rx_frame_errors = (unsigned long)(est->rx_bd_alignment_error +
1926 					       est->rx_alignment_error);
1927 	nst->rx_crc_errors = (unsigned long)(est->rx_bd_bad_fcs +
1928 					     est->rx_bad_fcs);
1929 	nst->rx_length_errors = (unsigned long)(est->rx_bd_runt_packet +
1930 						est->rx_bd_short_event +
1931 						est->rx_bd_packet_too_long +
1932 						est->rx_bd_out_of_range +
1933 						est->rx_bd_in_range +
1934 						est->rx_runt_packet +
1935 						est->rx_short_event +
1936 						est->rx_packet_too_long +
1937 						est->rx_out_of_range +
1938 						est->rx_in_range);
1939 
1940 	nst->tx_errors = (unsigned long)(est->tx_bd_errors + est->tx_errors);
1941 	nst->tx_fifo_errors = (unsigned long)(est->tx_bd_underrun +
1942 					      est->tx_underrun);
1943 	nst->tx_carrier_errors = (unsigned long)est->tx_bd_carrier_loss;
1944 	nst->collisions = (unsigned long)(est->tx_bd_excessive_deferral +
1945 					  est->tx_bd_excessive_collisions +
1946 					  est->tx_bd_late_collision +
1947 					  est->tx_bd_multple_collisions);
1948 	spin_unlock_irqrestore(&dev->lock, flags);
1949 	return nst;
1950 }
1951 
1952 static struct mal_commac_ops emac_commac_ops = {
1953 	.poll_tx = &emac_poll_tx,
1954 	.poll_rx = &emac_poll_rx,
1955 	.peek_rx = &emac_peek_rx,
1956 	.rxde = &emac_rxde,
1957 };
1958 
1959 static struct mal_commac_ops emac_commac_sg_ops = {
1960 	.poll_tx = &emac_poll_tx,
1961 	.poll_rx = &emac_poll_rx,
1962 	.peek_rx = &emac_peek_rx_sg,
1963 	.rxde = &emac_rxde,
1964 };
1965 
1966 /* Ethtool support */
1967 static int emac_ethtool_get_settings(struct net_device *ndev,
1968 				     struct ethtool_cmd *cmd)
1969 {
1970 	struct emac_instance *dev = netdev_priv(ndev);
1971 
1972 	cmd->supported = dev->phy.features;
1973 	cmd->port = PORT_MII;
1974 	cmd->phy_address = dev->phy.address;
1975 	cmd->transceiver =
1976 	    dev->phy.address >= 0 ? XCVR_EXTERNAL : XCVR_INTERNAL;
1977 
1978 	mutex_lock(&dev->link_lock);
1979 	cmd->advertising = dev->phy.advertising;
1980 	cmd->autoneg = dev->phy.autoneg;
1981 	cmd->speed = dev->phy.speed;
1982 	cmd->duplex = dev->phy.duplex;
1983 	mutex_unlock(&dev->link_lock);
1984 
1985 	return 0;
1986 }
1987 
1988 static int emac_ethtool_set_settings(struct net_device *ndev,
1989 				     struct ethtool_cmd *cmd)
1990 {
1991 	struct emac_instance *dev = netdev_priv(ndev);
1992 	u32 f = dev->phy.features;
1993 
1994 	DBG(dev, "set_settings(%d, %d, %d, 0x%08x)" NL,
1995 	    cmd->autoneg, cmd->speed, cmd->duplex, cmd->advertising);
1996 
1997 	/* Basic sanity checks */
1998 	if (dev->phy.address < 0)
1999 		return -EOPNOTSUPP;
2000 	if (cmd->autoneg != AUTONEG_ENABLE && cmd->autoneg != AUTONEG_DISABLE)
2001 		return -EINVAL;
2002 	if (cmd->autoneg == AUTONEG_ENABLE && cmd->advertising == 0)
2003 		return -EINVAL;
2004 	if (cmd->duplex != DUPLEX_HALF && cmd->duplex != DUPLEX_FULL)
2005 		return -EINVAL;
2006 
2007 	if (cmd->autoneg == AUTONEG_DISABLE) {
2008 		switch (cmd->speed) {
2009 		case SPEED_10:
2010 			if (cmd->duplex == DUPLEX_HALF &&
2011 			    !(f & SUPPORTED_10baseT_Half))
2012 				return -EINVAL;
2013 			if (cmd->duplex == DUPLEX_FULL &&
2014 			    !(f & SUPPORTED_10baseT_Full))
2015 				return -EINVAL;
2016 			break;
2017 		case SPEED_100:
2018 			if (cmd->duplex == DUPLEX_HALF &&
2019 			    !(f & SUPPORTED_100baseT_Half))
2020 				return -EINVAL;
2021 			if (cmd->duplex == DUPLEX_FULL &&
2022 			    !(f & SUPPORTED_100baseT_Full))
2023 				return -EINVAL;
2024 			break;
2025 		case SPEED_1000:
2026 			if (cmd->duplex == DUPLEX_HALF &&
2027 			    !(f & SUPPORTED_1000baseT_Half))
2028 				return -EINVAL;
2029 			if (cmd->duplex == DUPLEX_FULL &&
2030 			    !(f & SUPPORTED_1000baseT_Full))
2031 				return -EINVAL;
2032 			break;
2033 		default:
2034 			return -EINVAL;
2035 		}
2036 
2037 		mutex_lock(&dev->link_lock);
2038 		dev->phy.def->ops->setup_forced(&dev->phy, cmd->speed,
2039 						cmd->duplex);
2040 		mutex_unlock(&dev->link_lock);
2041 
2042 	} else {
2043 		if (!(f & SUPPORTED_Autoneg))
2044 			return -EINVAL;
2045 
2046 		mutex_lock(&dev->link_lock);
2047 		dev->phy.def->ops->setup_aneg(&dev->phy,
2048 					      (cmd->advertising & f) |
2049 					      (dev->phy.advertising &
2050 					       (ADVERTISED_Pause |
2051 						ADVERTISED_Asym_Pause)));
2052 		mutex_unlock(&dev->link_lock);
2053 	}
2054 	emac_force_link_update(dev);
2055 
2056 	return 0;
2057 }
2058 
2059 static void emac_ethtool_get_ringparam(struct net_device *ndev,
2060 				       struct ethtool_ringparam *rp)
2061 {
2062 	rp->rx_max_pending = rp->rx_pending = NUM_RX_BUFF;
2063 	rp->tx_max_pending = rp->tx_pending = NUM_TX_BUFF;
2064 }
2065 
2066 static void emac_ethtool_get_pauseparam(struct net_device *ndev,
2067 					struct ethtool_pauseparam *pp)
2068 {
2069 	struct emac_instance *dev = netdev_priv(ndev);
2070 
2071 	mutex_lock(&dev->link_lock);
2072 	if ((dev->phy.features & SUPPORTED_Autoneg) &&
2073 	    (dev->phy.advertising & (ADVERTISED_Pause | ADVERTISED_Asym_Pause)))
2074 		pp->autoneg = 1;
2075 
2076 	if (dev->phy.duplex == DUPLEX_FULL) {
2077 		if (dev->phy.pause)
2078 			pp->rx_pause = pp->tx_pause = 1;
2079 		else if (dev->phy.asym_pause)
2080 			pp->tx_pause = 1;
2081 	}
2082 	mutex_unlock(&dev->link_lock);
2083 }
2084 
2085 static int emac_get_regs_len(struct emac_instance *dev)
2086 {
2087 		return sizeof(struct emac_ethtool_regs_subhdr) +
2088 			sizeof(struct emac_regs);
2089 }
2090 
2091 static int emac_ethtool_get_regs_len(struct net_device *ndev)
2092 {
2093 	struct emac_instance *dev = netdev_priv(ndev);
2094 	int size;
2095 
2096 	size = sizeof(struct emac_ethtool_regs_hdr) +
2097 		emac_get_regs_len(dev) + mal_get_regs_len(dev->mal);
2098 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
2099 		size += zmii_get_regs_len(dev->zmii_dev);
2100 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
2101 		size += rgmii_get_regs_len(dev->rgmii_dev);
2102 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH))
2103 		size += tah_get_regs_len(dev->tah_dev);
2104 
2105 	return size;
2106 }
2107 
2108 static void *emac_dump_regs(struct emac_instance *dev, void *buf)
2109 {
2110 	struct emac_ethtool_regs_subhdr *hdr = buf;
2111 
2112 	hdr->index = dev->cell_index;
2113 	if (emac_has_feature(dev, EMAC_FTR_EMAC4SYNC)) {
2114 		hdr->version = EMAC4SYNC_ETHTOOL_REGS_VER;
2115 	} else if (emac_has_feature(dev, EMAC_FTR_EMAC4)) {
2116 		hdr->version = EMAC4_ETHTOOL_REGS_VER;
2117 	} else {
2118 		hdr->version = EMAC_ETHTOOL_REGS_VER;
2119 	}
2120 	memcpy_fromio(hdr + 1, dev->emacp, sizeof(struct emac_regs));
2121 	return (void *)(hdr + 1) + sizeof(struct emac_regs);
2122 }
2123 
2124 static void emac_ethtool_get_regs(struct net_device *ndev,
2125 				  struct ethtool_regs *regs, void *buf)
2126 {
2127 	struct emac_instance *dev = netdev_priv(ndev);
2128 	struct emac_ethtool_regs_hdr *hdr = buf;
2129 
2130 	hdr->components = 0;
2131 	buf = hdr + 1;
2132 
2133 	buf = mal_dump_regs(dev->mal, buf);
2134 	buf = emac_dump_regs(dev, buf);
2135 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII)) {
2136 		hdr->components |= EMAC_ETHTOOL_REGS_ZMII;
2137 		buf = zmii_dump_regs(dev->zmii_dev, buf);
2138 	}
2139 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII)) {
2140 		hdr->components |= EMAC_ETHTOOL_REGS_RGMII;
2141 		buf = rgmii_dump_regs(dev->rgmii_dev, buf);
2142 	}
2143 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH)) {
2144 		hdr->components |= EMAC_ETHTOOL_REGS_TAH;
2145 		buf = tah_dump_regs(dev->tah_dev, buf);
2146 	}
2147 }
2148 
2149 static int emac_ethtool_nway_reset(struct net_device *ndev)
2150 {
2151 	struct emac_instance *dev = netdev_priv(ndev);
2152 	int res = 0;
2153 
2154 	DBG(dev, "nway_reset" NL);
2155 
2156 	if (dev->phy.address < 0)
2157 		return -EOPNOTSUPP;
2158 
2159 	mutex_lock(&dev->link_lock);
2160 	if (!dev->phy.autoneg) {
2161 		res = -EINVAL;
2162 		goto out;
2163 	}
2164 
2165 	dev->phy.def->ops->setup_aneg(&dev->phy, dev->phy.advertising);
2166  out:
2167 	mutex_unlock(&dev->link_lock);
2168 	emac_force_link_update(dev);
2169 	return res;
2170 }
2171 
2172 static int emac_ethtool_get_sset_count(struct net_device *ndev, int stringset)
2173 {
2174 	if (stringset == ETH_SS_STATS)
2175 		return EMAC_ETHTOOL_STATS_COUNT;
2176 	else
2177 		return -EINVAL;
2178 }
2179 
2180 static void emac_ethtool_get_strings(struct net_device *ndev, u32 stringset,
2181 				     u8 * buf)
2182 {
2183 	if (stringset == ETH_SS_STATS)
2184 		memcpy(buf, &emac_stats_keys, sizeof(emac_stats_keys));
2185 }
2186 
2187 static void emac_ethtool_get_ethtool_stats(struct net_device *ndev,
2188 					   struct ethtool_stats *estats,
2189 					   u64 * tmp_stats)
2190 {
2191 	struct emac_instance *dev = netdev_priv(ndev);
2192 
2193 	memcpy(tmp_stats, &dev->stats, sizeof(dev->stats));
2194 	tmp_stats += sizeof(dev->stats) / sizeof(u64);
2195 	memcpy(tmp_stats, &dev->estats, sizeof(dev->estats));
2196 }
2197 
2198 static void emac_ethtool_get_drvinfo(struct net_device *ndev,
2199 				     struct ethtool_drvinfo *info)
2200 {
2201 	struct emac_instance *dev = netdev_priv(ndev);
2202 
2203 	strlcpy(info->driver, "ibm_emac", sizeof(info->driver));
2204 	strlcpy(info->version, DRV_VERSION, sizeof(info->version));
2205 	snprintf(info->bus_info, sizeof(info->bus_info), "PPC 4xx EMAC-%d %s",
2206 		 dev->cell_index, dev->ofdev->dev.of_node->full_name);
2207 	info->regdump_len = emac_ethtool_get_regs_len(ndev);
2208 }
2209 
2210 static const struct ethtool_ops emac_ethtool_ops = {
2211 	.get_settings = emac_ethtool_get_settings,
2212 	.set_settings = emac_ethtool_set_settings,
2213 	.get_drvinfo = emac_ethtool_get_drvinfo,
2214 
2215 	.get_regs_len = emac_ethtool_get_regs_len,
2216 	.get_regs = emac_ethtool_get_regs,
2217 
2218 	.nway_reset = emac_ethtool_nway_reset,
2219 
2220 	.get_ringparam = emac_ethtool_get_ringparam,
2221 	.get_pauseparam = emac_ethtool_get_pauseparam,
2222 
2223 	.get_strings = emac_ethtool_get_strings,
2224 	.get_sset_count = emac_ethtool_get_sset_count,
2225 	.get_ethtool_stats = emac_ethtool_get_ethtool_stats,
2226 
2227 	.get_link = ethtool_op_get_link,
2228 };
2229 
2230 static int emac_ioctl(struct net_device *ndev, struct ifreq *rq, int cmd)
2231 {
2232 	struct emac_instance *dev = netdev_priv(ndev);
2233 	struct mii_ioctl_data *data = if_mii(rq);
2234 
2235 	DBG(dev, "ioctl %08x" NL, cmd);
2236 
2237 	if (dev->phy.address < 0)
2238 		return -EOPNOTSUPP;
2239 
2240 	switch (cmd) {
2241 	case SIOCGMIIPHY:
2242 		data->phy_id = dev->phy.address;
2243 		/* Fall through */
2244 	case SIOCGMIIREG:
2245 		data->val_out = emac_mdio_read(ndev, dev->phy.address,
2246 					       data->reg_num);
2247 		return 0;
2248 
2249 	case SIOCSMIIREG:
2250 		emac_mdio_write(ndev, dev->phy.address, data->reg_num,
2251 				data->val_in);
2252 		return 0;
2253 	default:
2254 		return -EOPNOTSUPP;
2255 	}
2256 }
2257 
2258 struct emac_depentry {
2259 	u32			phandle;
2260 	struct device_node	*node;
2261 	struct platform_device	*ofdev;
2262 	void			*drvdata;
2263 };
2264 
2265 #define	EMAC_DEP_MAL_IDX	0
2266 #define	EMAC_DEP_ZMII_IDX	1
2267 #define	EMAC_DEP_RGMII_IDX	2
2268 #define	EMAC_DEP_TAH_IDX	3
2269 #define	EMAC_DEP_MDIO_IDX	4
2270 #define	EMAC_DEP_PREV_IDX	5
2271 #define	EMAC_DEP_COUNT		6
2272 
2273 static int emac_check_deps(struct emac_instance *dev,
2274 			   struct emac_depentry *deps)
2275 {
2276 	int i, there = 0;
2277 	struct device_node *np;
2278 
2279 	for (i = 0; i < EMAC_DEP_COUNT; i++) {
2280 		/* no dependency on that item, allright */
2281 		if (deps[i].phandle == 0) {
2282 			there++;
2283 			continue;
2284 		}
2285 		/* special case for blist as the dependency might go away */
2286 		if (i == EMAC_DEP_PREV_IDX) {
2287 			np = *(dev->blist - 1);
2288 			if (np == NULL) {
2289 				deps[i].phandle = 0;
2290 				there++;
2291 				continue;
2292 			}
2293 			if (deps[i].node == NULL)
2294 				deps[i].node = of_node_get(np);
2295 		}
2296 		if (deps[i].node == NULL)
2297 			deps[i].node = of_find_node_by_phandle(deps[i].phandle);
2298 		if (deps[i].node == NULL)
2299 			continue;
2300 		if (deps[i].ofdev == NULL)
2301 			deps[i].ofdev = of_find_device_by_node(deps[i].node);
2302 		if (deps[i].ofdev == NULL)
2303 			continue;
2304 		if (deps[i].drvdata == NULL)
2305 			deps[i].drvdata = platform_get_drvdata(deps[i].ofdev);
2306 		if (deps[i].drvdata != NULL)
2307 			there++;
2308 	}
2309 	return there == EMAC_DEP_COUNT;
2310 }
2311 
2312 static void emac_put_deps(struct emac_instance *dev)
2313 {
2314 	of_dev_put(dev->mal_dev);
2315 	of_dev_put(dev->zmii_dev);
2316 	of_dev_put(dev->rgmii_dev);
2317 	of_dev_put(dev->mdio_dev);
2318 	of_dev_put(dev->tah_dev);
2319 }
2320 
2321 static int emac_of_bus_notify(struct notifier_block *nb, unsigned long action,
2322 			      void *data)
2323 {
2324 	/* We are only intereted in device addition */
2325 	if (action == BUS_NOTIFY_BOUND_DRIVER)
2326 		wake_up_all(&emac_probe_wait);
2327 	return 0;
2328 }
2329 
2330 static struct notifier_block emac_of_bus_notifier = {
2331 	.notifier_call = emac_of_bus_notify
2332 };
2333 
2334 static int emac_wait_deps(struct emac_instance *dev)
2335 {
2336 	struct emac_depentry deps[EMAC_DEP_COUNT];
2337 	int i, err;
2338 
2339 	memset(&deps, 0, sizeof(deps));
2340 
2341 	deps[EMAC_DEP_MAL_IDX].phandle = dev->mal_ph;
2342 	deps[EMAC_DEP_ZMII_IDX].phandle = dev->zmii_ph;
2343 	deps[EMAC_DEP_RGMII_IDX].phandle = dev->rgmii_ph;
2344 	if (dev->tah_ph)
2345 		deps[EMAC_DEP_TAH_IDX].phandle = dev->tah_ph;
2346 	if (dev->mdio_ph)
2347 		deps[EMAC_DEP_MDIO_IDX].phandle = dev->mdio_ph;
2348 	if (dev->blist && dev->blist > emac_boot_list)
2349 		deps[EMAC_DEP_PREV_IDX].phandle = 0xffffffffu;
2350 	bus_register_notifier(&platform_bus_type, &emac_of_bus_notifier);
2351 	wait_event_timeout(emac_probe_wait,
2352 			   emac_check_deps(dev, deps),
2353 			   EMAC_PROBE_DEP_TIMEOUT);
2354 	bus_unregister_notifier(&platform_bus_type, &emac_of_bus_notifier);
2355 	err = emac_check_deps(dev, deps) ? 0 : -ENODEV;
2356 	for (i = 0; i < EMAC_DEP_COUNT; i++) {
2357 		of_node_put(deps[i].node);
2358 		if (err)
2359 			of_dev_put(deps[i].ofdev);
2360 	}
2361 	if (err == 0) {
2362 		dev->mal_dev = deps[EMAC_DEP_MAL_IDX].ofdev;
2363 		dev->zmii_dev = deps[EMAC_DEP_ZMII_IDX].ofdev;
2364 		dev->rgmii_dev = deps[EMAC_DEP_RGMII_IDX].ofdev;
2365 		dev->tah_dev = deps[EMAC_DEP_TAH_IDX].ofdev;
2366 		dev->mdio_dev = deps[EMAC_DEP_MDIO_IDX].ofdev;
2367 	}
2368 	of_dev_put(deps[EMAC_DEP_PREV_IDX].ofdev);
2369 	return err;
2370 }
2371 
2372 static int emac_read_uint_prop(struct device_node *np, const char *name,
2373 			       u32 *val, int fatal)
2374 {
2375 	int len;
2376 	const u32 *prop = of_get_property(np, name, &len);
2377 	if (prop == NULL || len < sizeof(u32)) {
2378 		if (fatal)
2379 			printk(KERN_ERR "%s: missing %s property\n",
2380 			       np->full_name, name);
2381 		return -ENODEV;
2382 	}
2383 	*val = *prop;
2384 	return 0;
2385 }
2386 
2387 static int emac_init_phy(struct emac_instance *dev)
2388 {
2389 	struct device_node *np = dev->ofdev->dev.of_node;
2390 	struct net_device *ndev = dev->ndev;
2391 	u32 phy_map, adv;
2392 	int i;
2393 
2394 	dev->phy.dev = ndev;
2395 	dev->phy.mode = dev->phy_mode;
2396 
2397 	/* PHY-less configuration.
2398 	 * XXX I probably should move these settings to the dev tree
2399 	 */
2400 	if (dev->phy_address == 0xffffffff && dev->phy_map == 0xffffffff) {
2401 		emac_reset(dev);
2402 
2403 		/* PHY-less configuration.
2404 		 * XXX I probably should move these settings to the dev tree
2405 		 */
2406 		dev->phy.address = -1;
2407 		dev->phy.features = SUPPORTED_MII;
2408 		if (emac_phy_supports_gige(dev->phy_mode))
2409 			dev->phy.features |= SUPPORTED_1000baseT_Full;
2410 		else
2411 			dev->phy.features |= SUPPORTED_100baseT_Full;
2412 		dev->phy.pause = 1;
2413 
2414 		return 0;
2415 	}
2416 
2417 	mutex_lock(&emac_phy_map_lock);
2418 	phy_map = dev->phy_map | busy_phy_map;
2419 
2420 	DBG(dev, "PHY maps %08x %08x" NL, dev->phy_map, busy_phy_map);
2421 
2422 	dev->phy.mdio_read = emac_mdio_read;
2423 	dev->phy.mdio_write = emac_mdio_write;
2424 
2425 	/* Enable internal clock source */
2426 #ifdef CONFIG_PPC_DCR_NATIVE
2427 	if (emac_has_feature(dev, EMAC_FTR_440GX_PHY_CLK_FIX))
2428 		dcri_clrset(SDR0, SDR0_MFR, 0, SDR0_MFR_ECS);
2429 #endif
2430 	/* PHY clock workaround */
2431 	emac_rx_clk_tx(dev);
2432 
2433 	/* Enable internal clock source on 440GX*/
2434 #ifdef CONFIG_PPC_DCR_NATIVE
2435 	if (emac_has_feature(dev, EMAC_FTR_440GX_PHY_CLK_FIX))
2436 		dcri_clrset(SDR0, SDR0_MFR, 0, SDR0_MFR_ECS);
2437 #endif
2438 	/* Configure EMAC with defaults so we can at least use MDIO
2439 	 * This is needed mostly for 440GX
2440 	 */
2441 	if (emac_phy_gpcs(dev->phy.mode)) {
2442 		/* XXX
2443 		 * Make GPCS PHY address equal to EMAC index.
2444 		 * We probably should take into account busy_phy_map
2445 		 * and/or phy_map here.
2446 		 *
2447 		 * Note that the busy_phy_map is currently global
2448 		 * while it should probably be per-ASIC...
2449 		 */
2450 		dev->phy.gpcs_address = dev->gpcs_address;
2451 		if (dev->phy.gpcs_address == 0xffffffff)
2452 			dev->phy.address = dev->cell_index;
2453 	}
2454 
2455 	emac_configure(dev);
2456 
2457 	if (dev->phy_address != 0xffffffff)
2458 		phy_map = ~(1 << dev->phy_address);
2459 
2460 	for (i = 0; i < 0x20; phy_map >>= 1, ++i)
2461 		if (!(phy_map & 1)) {
2462 			int r;
2463 			busy_phy_map |= 1 << i;
2464 
2465 			/* Quick check if there is a PHY at the address */
2466 			r = emac_mdio_read(dev->ndev, i, MII_BMCR);
2467 			if (r == 0xffff || r < 0)
2468 				continue;
2469 			if (!emac_mii_phy_probe(&dev->phy, i))
2470 				break;
2471 		}
2472 
2473 	/* Enable external clock source */
2474 #ifdef CONFIG_PPC_DCR_NATIVE
2475 	if (emac_has_feature(dev, EMAC_FTR_440GX_PHY_CLK_FIX))
2476 		dcri_clrset(SDR0, SDR0_MFR, SDR0_MFR_ECS, 0);
2477 #endif
2478 	mutex_unlock(&emac_phy_map_lock);
2479 	if (i == 0x20) {
2480 		printk(KERN_WARNING "%s: can't find PHY!\n", np->full_name);
2481 		return -ENXIO;
2482 	}
2483 
2484 	/* Init PHY */
2485 	if (dev->phy.def->ops->init)
2486 		dev->phy.def->ops->init(&dev->phy);
2487 
2488 	/* Disable any PHY features not supported by the platform */
2489 	dev->phy.def->features &= ~dev->phy_feat_exc;
2490 	dev->phy.features &= ~dev->phy_feat_exc;
2491 
2492 	/* Setup initial link parameters */
2493 	if (dev->phy.features & SUPPORTED_Autoneg) {
2494 		adv = dev->phy.features;
2495 		if (!emac_has_feature(dev, EMAC_FTR_NO_FLOW_CONTROL_40x))
2496 			adv |= ADVERTISED_Pause | ADVERTISED_Asym_Pause;
2497 		/* Restart autonegotiation */
2498 		dev->phy.def->ops->setup_aneg(&dev->phy, adv);
2499 	} else {
2500 		u32 f = dev->phy.def->features;
2501 		int speed = SPEED_10, fd = DUPLEX_HALF;
2502 
2503 		/* Select highest supported speed/duplex */
2504 		if (f & SUPPORTED_1000baseT_Full) {
2505 			speed = SPEED_1000;
2506 			fd = DUPLEX_FULL;
2507 		} else if (f & SUPPORTED_1000baseT_Half)
2508 			speed = SPEED_1000;
2509 		else if (f & SUPPORTED_100baseT_Full) {
2510 			speed = SPEED_100;
2511 			fd = DUPLEX_FULL;
2512 		} else if (f & SUPPORTED_100baseT_Half)
2513 			speed = SPEED_100;
2514 		else if (f & SUPPORTED_10baseT_Full)
2515 			fd = DUPLEX_FULL;
2516 
2517 		/* Force link parameters */
2518 		dev->phy.def->ops->setup_forced(&dev->phy, speed, fd);
2519 	}
2520 	return 0;
2521 }
2522 
2523 static int emac_init_config(struct emac_instance *dev)
2524 {
2525 	struct device_node *np = dev->ofdev->dev.of_node;
2526 	const void *p;
2527 
2528 	/* Read config from device-tree */
2529 	if (emac_read_uint_prop(np, "mal-device", &dev->mal_ph, 1))
2530 		return -ENXIO;
2531 	if (emac_read_uint_prop(np, "mal-tx-channel", &dev->mal_tx_chan, 1))
2532 		return -ENXIO;
2533 	if (emac_read_uint_prop(np, "mal-rx-channel", &dev->mal_rx_chan, 1))
2534 		return -ENXIO;
2535 	if (emac_read_uint_prop(np, "cell-index", &dev->cell_index, 1))
2536 		return -ENXIO;
2537 	if (emac_read_uint_prop(np, "max-frame-size", &dev->max_mtu, 0))
2538 		dev->max_mtu = 1500;
2539 	if (emac_read_uint_prop(np, "rx-fifo-size", &dev->rx_fifo_size, 0))
2540 		dev->rx_fifo_size = 2048;
2541 	if (emac_read_uint_prop(np, "tx-fifo-size", &dev->tx_fifo_size, 0))
2542 		dev->tx_fifo_size = 2048;
2543 	if (emac_read_uint_prop(np, "rx-fifo-size-gige", &dev->rx_fifo_size_gige, 0))
2544 		dev->rx_fifo_size_gige = dev->rx_fifo_size;
2545 	if (emac_read_uint_prop(np, "tx-fifo-size-gige", &dev->tx_fifo_size_gige, 0))
2546 		dev->tx_fifo_size_gige = dev->tx_fifo_size;
2547 	if (emac_read_uint_prop(np, "phy-address", &dev->phy_address, 0))
2548 		dev->phy_address = 0xffffffff;
2549 	if (emac_read_uint_prop(np, "phy-map", &dev->phy_map, 0))
2550 		dev->phy_map = 0xffffffff;
2551 	if (emac_read_uint_prop(np, "gpcs-address", &dev->gpcs_address, 0))
2552 		dev->gpcs_address = 0xffffffff;
2553 	if (emac_read_uint_prop(np->parent, "clock-frequency", &dev->opb_bus_freq, 1))
2554 		return -ENXIO;
2555 	if (emac_read_uint_prop(np, "tah-device", &dev->tah_ph, 0))
2556 		dev->tah_ph = 0;
2557 	if (emac_read_uint_prop(np, "tah-channel", &dev->tah_port, 0))
2558 		dev->tah_port = 0;
2559 	if (emac_read_uint_prop(np, "mdio-device", &dev->mdio_ph, 0))
2560 		dev->mdio_ph = 0;
2561 	if (emac_read_uint_prop(np, "zmii-device", &dev->zmii_ph, 0))
2562 		dev->zmii_ph = 0;
2563 	if (emac_read_uint_prop(np, "zmii-channel", &dev->zmii_port, 0))
2564 		dev->zmii_port = 0xffffffff;
2565 	if (emac_read_uint_prop(np, "rgmii-device", &dev->rgmii_ph, 0))
2566 		dev->rgmii_ph = 0;
2567 	if (emac_read_uint_prop(np, "rgmii-channel", &dev->rgmii_port, 0))
2568 		dev->rgmii_port = 0xffffffff;
2569 	if (emac_read_uint_prop(np, "fifo-entry-size", &dev->fifo_entry_size, 0))
2570 		dev->fifo_entry_size = 16;
2571 	if (emac_read_uint_prop(np, "mal-burst-size", &dev->mal_burst_size, 0))
2572 		dev->mal_burst_size = 256;
2573 
2574 	/* PHY mode needs some decoding */
2575 	dev->phy_mode = of_get_phy_mode(np);
2576 	if (dev->phy_mode < 0)
2577 		dev->phy_mode = PHY_MODE_NA;
2578 
2579 	/* Check EMAC version */
2580 	if (of_device_is_compatible(np, "ibm,emac4sync")) {
2581 		dev->features |= (EMAC_FTR_EMAC4 | EMAC_FTR_EMAC4SYNC);
2582 		if (of_device_is_compatible(np, "ibm,emac-460ex") ||
2583 		    of_device_is_compatible(np, "ibm,emac-460gt"))
2584 			dev->features |= EMAC_FTR_460EX_PHY_CLK_FIX;
2585 		if (of_device_is_compatible(np, "ibm,emac-405ex") ||
2586 		    of_device_is_compatible(np, "ibm,emac-405exr"))
2587 			dev->features |= EMAC_FTR_440EP_PHY_CLK_FIX;
2588 		if (of_device_is_compatible(np, "ibm,emac-apm821xx")) {
2589 			dev->features |= (EMAC_APM821XX_REQ_JUMBO_FRAME_SIZE |
2590 					  EMAC_FTR_APM821XX_NO_HALF_DUPLEX |
2591 					  EMAC_FTR_460EX_PHY_CLK_FIX);
2592 		}
2593 	} else if (of_device_is_compatible(np, "ibm,emac4")) {
2594 		dev->features |= EMAC_FTR_EMAC4;
2595 		if (of_device_is_compatible(np, "ibm,emac-440gx"))
2596 			dev->features |= EMAC_FTR_440GX_PHY_CLK_FIX;
2597 	} else {
2598 		if (of_device_is_compatible(np, "ibm,emac-440ep") ||
2599 		    of_device_is_compatible(np, "ibm,emac-440gr"))
2600 			dev->features |= EMAC_FTR_440EP_PHY_CLK_FIX;
2601 		if (of_device_is_compatible(np, "ibm,emac-405ez")) {
2602 #ifdef CONFIG_IBM_EMAC_NO_FLOW_CTRL
2603 			dev->features |= EMAC_FTR_NO_FLOW_CONTROL_40x;
2604 #else
2605 			printk(KERN_ERR "%s: Flow control not disabled!\n",
2606 					np->full_name);
2607 			return -ENXIO;
2608 #endif
2609 		}
2610 
2611 	}
2612 
2613 	/* Fixup some feature bits based on the device tree */
2614 	if (of_get_property(np, "has-inverted-stacr-oc", NULL))
2615 		dev->features |= EMAC_FTR_STACR_OC_INVERT;
2616 	if (of_get_property(np, "has-new-stacr-staopc", NULL))
2617 		dev->features |= EMAC_FTR_HAS_NEW_STACR;
2618 
2619 	/* CAB lacks the appropriate properties */
2620 	if (of_device_is_compatible(np, "ibm,emac-axon"))
2621 		dev->features |= EMAC_FTR_HAS_NEW_STACR |
2622 			EMAC_FTR_STACR_OC_INVERT;
2623 
2624 	/* Enable TAH/ZMII/RGMII features as found */
2625 	if (dev->tah_ph != 0) {
2626 #ifdef CONFIG_IBM_EMAC_TAH
2627 		dev->features |= EMAC_FTR_HAS_TAH;
2628 #else
2629 		printk(KERN_ERR "%s: TAH support not enabled !\n",
2630 		       np->full_name);
2631 		return -ENXIO;
2632 #endif
2633 	}
2634 
2635 	if (dev->zmii_ph != 0) {
2636 #ifdef CONFIG_IBM_EMAC_ZMII
2637 		dev->features |= EMAC_FTR_HAS_ZMII;
2638 #else
2639 		printk(KERN_ERR "%s: ZMII support not enabled !\n",
2640 		       np->full_name);
2641 		return -ENXIO;
2642 #endif
2643 	}
2644 
2645 	if (dev->rgmii_ph != 0) {
2646 #ifdef CONFIG_IBM_EMAC_RGMII
2647 		dev->features |= EMAC_FTR_HAS_RGMII;
2648 #else
2649 		printk(KERN_ERR "%s: RGMII support not enabled !\n",
2650 		       np->full_name);
2651 		return -ENXIO;
2652 #endif
2653 	}
2654 
2655 	/* Read MAC-address */
2656 	p = of_get_property(np, "local-mac-address", NULL);
2657 	if (p == NULL) {
2658 		printk(KERN_ERR "%s: Can't find local-mac-address property\n",
2659 		       np->full_name);
2660 		return -ENXIO;
2661 	}
2662 	memcpy(dev->ndev->dev_addr, p, ETH_ALEN);
2663 
2664 	/* IAHT and GAHT filter parameterization */
2665 	if (emac_has_feature(dev, EMAC_FTR_EMAC4SYNC)) {
2666 		dev->xaht_slots_shift = EMAC4SYNC_XAHT_SLOTS_SHIFT;
2667 		dev->xaht_width_shift = EMAC4SYNC_XAHT_WIDTH_SHIFT;
2668 	} else {
2669 		dev->xaht_slots_shift = EMAC4_XAHT_SLOTS_SHIFT;
2670 		dev->xaht_width_shift = EMAC4_XAHT_WIDTH_SHIFT;
2671 	}
2672 
2673 	DBG(dev, "features     : 0x%08x / 0x%08x\n", dev->features, EMAC_FTRS_POSSIBLE);
2674 	DBG(dev, "tx_fifo_size : %d (%d gige)\n", dev->tx_fifo_size, dev->tx_fifo_size_gige);
2675 	DBG(dev, "rx_fifo_size : %d (%d gige)\n", dev->rx_fifo_size, dev->rx_fifo_size_gige);
2676 	DBG(dev, "max_mtu      : %d\n", dev->max_mtu);
2677 	DBG(dev, "OPB freq     : %d\n", dev->opb_bus_freq);
2678 
2679 	return 0;
2680 }
2681 
2682 static const struct net_device_ops emac_netdev_ops = {
2683 	.ndo_open		= emac_open,
2684 	.ndo_stop		= emac_close,
2685 	.ndo_get_stats		= emac_stats,
2686 	.ndo_set_rx_mode	= emac_set_multicast_list,
2687 	.ndo_do_ioctl		= emac_ioctl,
2688 	.ndo_tx_timeout		= emac_tx_timeout,
2689 	.ndo_validate_addr	= eth_validate_addr,
2690 	.ndo_set_mac_address	= eth_mac_addr,
2691 	.ndo_start_xmit		= emac_start_xmit,
2692 	.ndo_change_mtu		= eth_change_mtu,
2693 };
2694 
2695 static const struct net_device_ops emac_gige_netdev_ops = {
2696 	.ndo_open		= emac_open,
2697 	.ndo_stop		= emac_close,
2698 	.ndo_get_stats		= emac_stats,
2699 	.ndo_set_rx_mode	= emac_set_multicast_list,
2700 	.ndo_do_ioctl		= emac_ioctl,
2701 	.ndo_tx_timeout		= emac_tx_timeout,
2702 	.ndo_validate_addr	= eth_validate_addr,
2703 	.ndo_set_mac_address	= eth_mac_addr,
2704 	.ndo_start_xmit		= emac_start_xmit_sg,
2705 	.ndo_change_mtu		= emac_change_mtu,
2706 };
2707 
2708 static int emac_probe(struct platform_device *ofdev)
2709 {
2710 	struct net_device *ndev;
2711 	struct emac_instance *dev;
2712 	struct device_node *np = ofdev->dev.of_node;
2713 	struct device_node **blist = NULL;
2714 	int err, i;
2715 
2716 	/* Skip unused/unwired EMACS.  We leave the check for an unused
2717 	 * property here for now, but new flat device trees should set a
2718 	 * status property to "disabled" instead.
2719 	 */
2720 	if (of_get_property(np, "unused", NULL) || !of_device_is_available(np))
2721 		return -ENODEV;
2722 
2723 	/* Find ourselves in the bootlist if we are there */
2724 	for (i = 0; i < EMAC_BOOT_LIST_SIZE; i++)
2725 		if (emac_boot_list[i] == np)
2726 			blist = &emac_boot_list[i];
2727 
2728 	/* Allocate our net_device structure */
2729 	err = -ENOMEM;
2730 	ndev = alloc_etherdev(sizeof(struct emac_instance));
2731 	if (!ndev)
2732 		goto err_gone;
2733 
2734 	dev = netdev_priv(ndev);
2735 	dev->ndev = ndev;
2736 	dev->ofdev = ofdev;
2737 	dev->blist = blist;
2738 	SET_NETDEV_DEV(ndev, &ofdev->dev);
2739 
2740 	/* Initialize some embedded data structures */
2741 	mutex_init(&dev->mdio_lock);
2742 	mutex_init(&dev->link_lock);
2743 	spin_lock_init(&dev->lock);
2744 	INIT_WORK(&dev->reset_work, emac_reset_work);
2745 
2746 	/* Init various config data based on device-tree */
2747 	err = emac_init_config(dev);
2748 	if (err != 0)
2749 		goto err_free;
2750 
2751 	/* Get interrupts. EMAC irq is mandatory, WOL irq is optional */
2752 	dev->emac_irq = irq_of_parse_and_map(np, 0);
2753 	dev->wol_irq = irq_of_parse_and_map(np, 1);
2754 	if (dev->emac_irq == NO_IRQ) {
2755 		printk(KERN_ERR "%s: Can't map main interrupt\n", np->full_name);
2756 		goto err_free;
2757 	}
2758 	ndev->irq = dev->emac_irq;
2759 
2760 	/* Map EMAC regs */
2761 	if (of_address_to_resource(np, 0, &dev->rsrc_regs)) {
2762 		printk(KERN_ERR "%s: Can't get registers address\n",
2763 		       np->full_name);
2764 		goto err_irq_unmap;
2765 	}
2766 	// TODO : request_mem_region
2767 	dev->emacp = ioremap(dev->rsrc_regs.start,
2768 			     resource_size(&dev->rsrc_regs));
2769 	if (dev->emacp == NULL) {
2770 		printk(KERN_ERR "%s: Can't map device registers!\n",
2771 		       np->full_name);
2772 		err = -ENOMEM;
2773 		goto err_irq_unmap;
2774 	}
2775 
2776 	/* Wait for dependent devices */
2777 	err = emac_wait_deps(dev);
2778 	if (err) {
2779 		printk(KERN_ERR
2780 		       "%s: Timeout waiting for dependent devices\n",
2781 		       np->full_name);
2782 		/*  display more info about what's missing ? */
2783 		goto err_reg_unmap;
2784 	}
2785 	dev->mal = platform_get_drvdata(dev->mal_dev);
2786 	if (dev->mdio_dev != NULL)
2787 		dev->mdio_instance = platform_get_drvdata(dev->mdio_dev);
2788 
2789 	/* Register with MAL */
2790 	dev->commac.ops = &emac_commac_ops;
2791 	dev->commac.dev = dev;
2792 	dev->commac.tx_chan_mask = MAL_CHAN_MASK(dev->mal_tx_chan);
2793 	dev->commac.rx_chan_mask = MAL_CHAN_MASK(dev->mal_rx_chan);
2794 	err = mal_register_commac(dev->mal, &dev->commac);
2795 	if (err) {
2796 		printk(KERN_ERR "%s: failed to register with mal %s!\n",
2797 		       np->full_name, dev->mal_dev->dev.of_node->full_name);
2798 		goto err_rel_deps;
2799 	}
2800 	dev->rx_skb_size = emac_rx_skb_size(ndev->mtu);
2801 	dev->rx_sync_size = emac_rx_sync_size(ndev->mtu);
2802 
2803 	/* Get pointers to BD rings */
2804 	dev->tx_desc =
2805 	    dev->mal->bd_virt + mal_tx_bd_offset(dev->mal, dev->mal_tx_chan);
2806 	dev->rx_desc =
2807 	    dev->mal->bd_virt + mal_rx_bd_offset(dev->mal, dev->mal_rx_chan);
2808 
2809 	DBG(dev, "tx_desc %p" NL, dev->tx_desc);
2810 	DBG(dev, "rx_desc %p" NL, dev->rx_desc);
2811 
2812 	/* Clean rings */
2813 	memset(dev->tx_desc, 0, NUM_TX_BUFF * sizeof(struct mal_descriptor));
2814 	memset(dev->rx_desc, 0, NUM_RX_BUFF * sizeof(struct mal_descriptor));
2815 	memset(dev->tx_skb, 0, NUM_TX_BUFF * sizeof(struct sk_buff *));
2816 	memset(dev->rx_skb, 0, NUM_RX_BUFF * sizeof(struct sk_buff *));
2817 
2818 	/* Attach to ZMII, if needed */
2819 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII) &&
2820 	    (err = zmii_attach(dev->zmii_dev, dev->zmii_port, &dev->phy_mode)) != 0)
2821 		goto err_unreg_commac;
2822 
2823 	/* Attach to RGMII, if needed */
2824 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII) &&
2825 	    (err = rgmii_attach(dev->rgmii_dev, dev->rgmii_port, dev->phy_mode)) != 0)
2826 		goto err_detach_zmii;
2827 
2828 	/* Attach to TAH, if needed */
2829 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH) &&
2830 	    (err = tah_attach(dev->tah_dev, dev->tah_port)) != 0)
2831 		goto err_detach_rgmii;
2832 
2833 	/* Set some link defaults before we can find out real parameters */
2834 	dev->phy.speed = SPEED_100;
2835 	dev->phy.duplex = DUPLEX_FULL;
2836 	dev->phy.autoneg = AUTONEG_DISABLE;
2837 	dev->phy.pause = dev->phy.asym_pause = 0;
2838 	dev->stop_timeout = STOP_TIMEOUT_100;
2839 	INIT_DELAYED_WORK(&dev->link_work, emac_link_timer);
2840 
2841 	/* Some SoCs like APM821xx does not support Half Duplex mode. */
2842 	if (emac_has_feature(dev, EMAC_FTR_APM821XX_NO_HALF_DUPLEX)) {
2843 		dev->phy_feat_exc = (SUPPORTED_1000baseT_Half |
2844 				     SUPPORTED_100baseT_Half |
2845 				     SUPPORTED_10baseT_Half);
2846 	}
2847 
2848 	/* Find PHY if any */
2849 	err = emac_init_phy(dev);
2850 	if (err != 0)
2851 		goto err_detach_tah;
2852 
2853 	if (dev->tah_dev) {
2854 		ndev->hw_features = NETIF_F_IP_CSUM | NETIF_F_SG;
2855 		ndev->features |= ndev->hw_features | NETIF_F_RXCSUM;
2856 	}
2857 	ndev->watchdog_timeo = 5 * HZ;
2858 	if (emac_phy_supports_gige(dev->phy_mode)) {
2859 		ndev->netdev_ops = &emac_gige_netdev_ops;
2860 		dev->commac.ops = &emac_commac_sg_ops;
2861 	} else
2862 		ndev->netdev_ops = &emac_netdev_ops;
2863 	ndev->ethtool_ops = &emac_ethtool_ops;
2864 
2865 	netif_carrier_off(ndev);
2866 
2867 	err = register_netdev(ndev);
2868 	if (err) {
2869 		printk(KERN_ERR "%s: failed to register net device (%d)!\n",
2870 		       np->full_name, err);
2871 		goto err_detach_tah;
2872 	}
2873 
2874 	/* Set our drvdata last as we don't want them visible until we are
2875 	 * fully initialized
2876 	 */
2877 	wmb();
2878 	platform_set_drvdata(ofdev, dev);
2879 
2880 	/* There's a new kid in town ! Let's tell everybody */
2881 	wake_up_all(&emac_probe_wait);
2882 
2883 
2884 	printk(KERN_INFO "%s: EMAC-%d %s, MAC %pM\n",
2885 	       ndev->name, dev->cell_index, np->full_name, ndev->dev_addr);
2886 
2887 	if (dev->phy_mode == PHY_MODE_SGMII)
2888 		printk(KERN_NOTICE "%s: in SGMII mode\n", ndev->name);
2889 
2890 	if (dev->phy.address >= 0)
2891 		printk("%s: found %s PHY (0x%02x)\n", ndev->name,
2892 		       dev->phy.def->name, dev->phy.address);
2893 
2894 	emac_dbg_register(dev);
2895 
2896 	/* Life is good */
2897 	return 0;
2898 
2899 	/* I have a bad feeling about this ... */
2900 
2901  err_detach_tah:
2902 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH))
2903 		tah_detach(dev->tah_dev, dev->tah_port);
2904  err_detach_rgmii:
2905 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
2906 		rgmii_detach(dev->rgmii_dev, dev->rgmii_port);
2907  err_detach_zmii:
2908 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
2909 		zmii_detach(dev->zmii_dev, dev->zmii_port);
2910  err_unreg_commac:
2911 	mal_unregister_commac(dev->mal, &dev->commac);
2912  err_rel_deps:
2913 	emac_put_deps(dev);
2914  err_reg_unmap:
2915 	iounmap(dev->emacp);
2916  err_irq_unmap:
2917 	if (dev->wol_irq != NO_IRQ)
2918 		irq_dispose_mapping(dev->wol_irq);
2919 	if (dev->emac_irq != NO_IRQ)
2920 		irq_dispose_mapping(dev->emac_irq);
2921  err_free:
2922 	free_netdev(ndev);
2923  err_gone:
2924 	/* if we were on the bootlist, remove us as we won't show up and
2925 	 * wake up all waiters to notify them in case they were waiting
2926 	 * on us
2927 	 */
2928 	if (blist) {
2929 		*blist = NULL;
2930 		wake_up_all(&emac_probe_wait);
2931 	}
2932 	return err;
2933 }
2934 
2935 static int emac_remove(struct platform_device *ofdev)
2936 {
2937 	struct emac_instance *dev = platform_get_drvdata(ofdev);
2938 
2939 	DBG(dev, "remove" NL);
2940 
2941 	unregister_netdev(dev->ndev);
2942 
2943 	cancel_work_sync(&dev->reset_work);
2944 
2945 	if (emac_has_feature(dev, EMAC_FTR_HAS_TAH))
2946 		tah_detach(dev->tah_dev, dev->tah_port);
2947 	if (emac_has_feature(dev, EMAC_FTR_HAS_RGMII))
2948 		rgmii_detach(dev->rgmii_dev, dev->rgmii_port);
2949 	if (emac_has_feature(dev, EMAC_FTR_HAS_ZMII))
2950 		zmii_detach(dev->zmii_dev, dev->zmii_port);
2951 
2952 	busy_phy_map &= ~(1 << dev->phy.address);
2953 	DBG(dev, "busy_phy_map now %#x" NL, busy_phy_map);
2954 
2955 	mal_unregister_commac(dev->mal, &dev->commac);
2956 	emac_put_deps(dev);
2957 
2958 	emac_dbg_unregister(dev);
2959 	iounmap(dev->emacp);
2960 
2961 	if (dev->wol_irq != NO_IRQ)
2962 		irq_dispose_mapping(dev->wol_irq);
2963 	if (dev->emac_irq != NO_IRQ)
2964 		irq_dispose_mapping(dev->emac_irq);
2965 
2966 	free_netdev(dev->ndev);
2967 
2968 	return 0;
2969 }
2970 
2971 /* XXX Features in here should be replaced by properties... */
2972 static const struct of_device_id emac_match[] =
2973 {
2974 	{
2975 		.type		= "network",
2976 		.compatible	= "ibm,emac",
2977 	},
2978 	{
2979 		.type		= "network",
2980 		.compatible	= "ibm,emac4",
2981 	},
2982 	{
2983 		.type		= "network",
2984 		.compatible	= "ibm,emac4sync",
2985 	},
2986 	{},
2987 };
2988 MODULE_DEVICE_TABLE(of, emac_match);
2989 
2990 static struct platform_driver emac_driver = {
2991 	.driver = {
2992 		.name = "emac",
2993 		.of_match_table = emac_match,
2994 	},
2995 	.probe = emac_probe,
2996 	.remove = emac_remove,
2997 };
2998 
2999 static void __init emac_make_bootlist(void)
3000 {
3001 	struct device_node *np = NULL;
3002 	int j, max, i = 0;
3003 	int cell_indices[EMAC_BOOT_LIST_SIZE];
3004 
3005 	/* Collect EMACs */
3006 	while((np = of_find_all_nodes(np)) != NULL) {
3007 		const u32 *idx;
3008 
3009 		if (of_match_node(emac_match, np) == NULL)
3010 			continue;
3011 		if (of_get_property(np, "unused", NULL))
3012 			continue;
3013 		idx = of_get_property(np, "cell-index", NULL);
3014 		if (idx == NULL)
3015 			continue;
3016 		cell_indices[i] = *idx;
3017 		emac_boot_list[i++] = of_node_get(np);
3018 		if (i >= EMAC_BOOT_LIST_SIZE) {
3019 			of_node_put(np);
3020 			break;
3021 		}
3022 	}
3023 	max = i;
3024 
3025 	/* Bubble sort them (doh, what a creative algorithm :-) */
3026 	for (i = 0; max > 1 && (i < (max - 1)); i++)
3027 		for (j = i; j < max; j++) {
3028 			if (cell_indices[i] > cell_indices[j]) {
3029 				swap(emac_boot_list[i], emac_boot_list[j]);
3030 				swap(cell_indices[i], cell_indices[j]);
3031 			}
3032 		}
3033 }
3034 
3035 static int __init emac_init(void)
3036 {
3037 	int rc;
3038 
3039 	printk(KERN_INFO DRV_DESC ", version " DRV_VERSION "\n");
3040 
3041 	/* Init debug stuff */
3042 	emac_init_debug();
3043 
3044 	/* Build EMAC boot list */
3045 	emac_make_bootlist();
3046 
3047 	/* Init submodules */
3048 	rc = mal_init();
3049 	if (rc)
3050 		goto err;
3051 	rc = zmii_init();
3052 	if (rc)
3053 		goto err_mal;
3054 	rc = rgmii_init();
3055 	if (rc)
3056 		goto err_zmii;
3057 	rc = tah_init();
3058 	if (rc)
3059 		goto err_rgmii;
3060 	rc = platform_driver_register(&emac_driver);
3061 	if (rc)
3062 		goto err_tah;
3063 
3064 	return 0;
3065 
3066  err_tah:
3067 	tah_exit();
3068  err_rgmii:
3069 	rgmii_exit();
3070  err_zmii:
3071 	zmii_exit();
3072  err_mal:
3073 	mal_exit();
3074  err:
3075 	return rc;
3076 }
3077 
3078 static void __exit emac_exit(void)
3079 {
3080 	int i;
3081 
3082 	platform_driver_unregister(&emac_driver);
3083 
3084 	tah_exit();
3085 	rgmii_exit();
3086 	zmii_exit();
3087 	mal_exit();
3088 	emac_fini_debug();
3089 
3090 	/* Destroy EMAC boot list */
3091 	for (i = 0; i < EMAC_BOOT_LIST_SIZE; i++)
3092 		of_node_put(emac_boot_list[i]);
3093 }
3094 
3095 module_init(emac_init);
3096 module_exit(emac_exit);
3097