1 /* QLogic qede NIC Driver
2  * Copyright (c) 2015-2017  QLogic Corporation
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and /or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  */
32 #ifndef _QEDE_H_
33 #define _QEDE_H_
34 #include <linux/compiler.h>
35 #include <linux/version.h>
36 #include <linux/workqueue.h>
37 #include <linux/netdevice.h>
38 #include <linux/interrupt.h>
39 #include <linux/bitmap.h>
40 #include <linux/kernel.h>
41 #include <linux/mutex.h>
42 #include <linux/bpf.h>
43 #include <net/xdp.h>
44 #include <linux/qed/qede_rdma.h>
45 #include <linux/io.h>
46 #ifdef CONFIG_RFS_ACCEL
47 #include <linux/cpu_rmap.h>
48 #endif
49 #include <linux/qed/common_hsi.h>
50 #include <linux/qed/eth_common.h>
51 #include <linux/qed/qed_if.h>
52 #include <linux/qed/qed_chain.h>
53 #include <linux/qed/qed_eth_if.h>
54 
/* Driver version, kept as four numeric components. DRV_MODULE_VERSION
 * stringifies each component and joins them with dots, in the order
 * major.minor.revision.engineering.
 */
55 #define QEDE_MAJOR_VERSION		8
56 #define QEDE_MINOR_VERSION		33
57 #define QEDE_REVISION_VERSION		0
58 #define QEDE_ENGINEERING_VERSION	20
59 #define DRV_MODULE_VERSION __stringify(QEDE_MAJOR_VERSION) "."	\
60 		__stringify(QEDE_MINOR_VERSION) "."		\
61 		__stringify(QEDE_REVISION_VERSION) "."		\
62 		__stringify(QEDE_ENGINEERING_VERSION)
63 
/* Expands to a bare identifier, not a string literal. */
64 #define DRV_MODULE_SYM		qede
65 
/* Counters stored outside the bb/ah union of struct qede_stats (as its
 * `common` member), i.e. present regardless of which union arm is in use.
 * Every counter is a u64.
 *
 * NOTE(review): `rx_mac_crtl_frames` looks like a misspelling of "ctrl"
 * (compare `tx_mac_ctrl_frames`); renaming it would require updating the
 * users of this field outside this header.
 */
66 struct qede_stats_common {
67 	u64 no_buff_discards;
68 	u64 packet_too_big_discard;
69 	u64 ttl0_discard;
70 	u64 rx_ucast_bytes;
71 	u64 rx_mcast_bytes;
72 	u64 rx_bcast_bytes;
73 	u64 rx_ucast_pkts;
74 	u64 rx_mcast_pkts;
75 	u64 rx_bcast_pkts;
76 	u64 mftag_filter_discards;
77 	u64 mac_filter_discards;
78 	u64 tx_ucast_bytes;
79 	u64 tx_mcast_bytes;
80 	u64 tx_bcast_bytes;
81 	u64 tx_ucast_pkts;
82 	u64 tx_mcast_pkts;
83 	u64 tx_bcast_pkts;
84 	u64 tx_err_drop_pkts;
85 	u64 coalesced_pkts;
86 	u64 coalesced_events;
87 	u64 coalesced_aborts_num;
88 	u64 non_coalesced_pkts;
89 	u64 coalesced_bytes;
90 
91 	/* port */
92 	u64 rx_64_byte_packets;
93 	u64 rx_65_to_127_byte_packets;
94 	u64 rx_128_to_255_byte_packets;
95 	u64 rx_256_to_511_byte_packets;
96 	u64 rx_512_to_1023_byte_packets;
97 	u64 rx_1024_to_1518_byte_packets;
98 	u64 rx_crc_errors;
99 	u64 rx_mac_crtl_frames;
100 	u64 rx_pause_frames;
101 	u64 rx_pfc_frames;
102 	u64 rx_align_errors;
103 	u64 rx_carrier_errors;
104 	u64 rx_oversize_packets;
105 	u64 rx_jabbers;
106 	u64 rx_undersize_packets;
107 	u64 rx_fragments;
108 	u64 tx_64_byte_packets;
109 	u64 tx_65_to_127_byte_packets;
110 	u64 tx_128_to_255_byte_packets;
111 	u64 tx_256_to_511_byte_packets;
112 	u64 tx_512_to_1023_byte_packets;
113 	u64 tx_1024_to_1518_byte_packets;
114 	u64 tx_pause_frames;
115 	u64 tx_pfc_frames;
116 	u64 brb_truncates;
117 	u64 brb_discards;
118 	u64 tx_mac_ctrl_frames;
119 };
120 
/* Counters held in the `bb` arm of the union inside struct qede_stats.
 * NOTE(review): presumably only meaningful when QEDE_IS_BB(edev) is true -
 * confirm against the code that fills the statistics.
 */
121 struct qede_stats_bb {
122 	u64 rx_1519_to_1522_byte_packets;
123 	u64 rx_1519_to_2047_byte_packets;
124 	u64 rx_2048_to_4095_byte_packets;
125 	u64 rx_4096_to_9216_byte_packets;
126 	u64 rx_9217_to_16383_byte_packets;
127 	u64 tx_1519_to_2047_byte_packets;
128 	u64 tx_2048_to_4095_byte_packets;
129 	u64 tx_4096_to_9216_byte_packets;
130 	u64 tx_9217_to_16383_byte_packets;
131 	u64 tx_lpi_entry_count;
132 	u64 tx_total_collisions;
133 };
134 
/* Counters held in the `ah` arm of the union inside struct qede_stats.
 * NOTE(review): presumably only meaningful when QEDE_IS_AH(edev) is true -
 * confirm against the code that fills the statistics.
 */
135 struct qede_stats_ah {
136 	u64 rx_1519_to_max_byte_packets;
137 	u64 tx_1519_to_max_byte_packets;
138 };
139 
/* Complete statistics set: the common counters followed by an anonymous
 * union of the bb and ah counter sets. The two union arms share storage,
 * so only one of them holds valid data at a time.
 */
140 struct qede_stats {
141 	struct qede_stats_common common;
142 
143 	union {
144 		struct qede_stats_bb bb;
145 		struct qede_stats_ah ah;
146 	};
147 };
148 
/* One VLAN entry, linkable into a list through `list`.
 * NOTE(review): presumably chained on qede_dev::vlan_list - confirm.
 */
149 struct qede_vlan {
150 	struct list_head list;
151 	u16 vid;		/* VLAN id */
152 	bool configured;
153 };
154 
/* RDMA-related state embedded in struct qede_dev as `rdma_info`: a pointer
 * to the qedr device, a list linkage (`entry`), the head of an RDMA event
 * list and the workqueue pointer `rdma_wq`.
 */
155 struct qede_rdma_dev {
156 	struct qedr_dev *qedr_dev;
157 	struct list_head entry;
158 	struct list_head rdma_event_list;
159 	struct workqueue_struct *rdma_wq;
160 };
161 
/* Forward declaration: this header only refers to struct qede_ptp through a
 * pointer (qede_dev::ptp), so the full definition is not needed here.
 */
162 struct qede_ptp;
163 
/* NOTE(review): presumably the upper bound on RFS filters - confirm. */
164 #define QEDE_RFS_MAX_FLTR	256
165 
/* Per-device driver state: pointers to the qed core device, the net_device
 * and the PCI device, queue accounting, RSS/VLAN/tunnel settings,
 * statistics, RDMA info and the XDP program pointer. Helper macros are
 * defined next to the fields they read.
 */
166 struct qede_dev {
167 	struct qed_dev			*cdev;
168 	struct net_device		*ndev;
169 	struct pci_dev			*pdev;
170 
171 	u32				dp_module;
172 	u8				dp_level;
173 
	/* Bit flags; the QEDE_FLAG_* / QEDE_*_EN masks below apply to it.
	 * IS_VF() yields 1 when QEDE_FLAG_IS_VF is set and 0 otherwise.
	 * NOTE(review): "PRORGESS" in QEDE_FLAGS_PTP_TX_IN_PRORGESS looks
	 * like a misspelling of "PROGRESS"; the name is kept because users
	 * outside this header reference it.
	 */
174 	unsigned long flags;
175 #define QEDE_FLAG_IS_VF			BIT(0)
176 #define IS_VF(edev)	(!!((edev)->flags & QEDE_FLAG_IS_VF))
177 #define QEDE_TX_TIMESTAMPING_EN		BIT(1)
178 #define QEDE_FLAGS_PTP_TX_IN_PRORGESS	BIT(2)
179 
180 	const struct qed_eth_ops	*ops;
181 	struct qede_ptp			*ptp;
182 
	/* Both *_MAX_*_CNT macros read dev_info.num_queues; the IS_BB/IS_AH
	 * macros compare dev_info.common.dev_type against the device type.
	 */
183 	struct qed_dev_eth_info dev_info;
184 #define QEDE_MAX_RSS_CNT(edev)	((edev)->dev_info.num_queues)
185 #define QEDE_MAX_TSS_CNT(edev)	((edev)->dev_info.num_queues)
186 #define QEDE_IS_BB(edev) \
187 	((edev)->dev_info.common.dev_type == QED_DEV_TYPE_BB)
188 #define QEDE_IS_AH(edev) \
189 	((edev)->dev_info.common.dev_type == QED_DEV_TYPE_AH)
190 
191 	struct qede_fastpath		*fp_array;
192 	u8				req_num_tx;
193 	u8				fp_num_tx;
194 	u8				req_num_rx;
195 	u8				fp_num_rx;
196 	u16				req_queues;
197 	u16				num_queues;
	/* QEDE_RSS_COUNT is num_queues minus fp_num_tx and QEDE_TSS_COUNT is
	 * num_queues minus fp_num_rx. QEDE_RX_QUEUE_IDX ignores edev and
	 * returns i unchanged.
	 */
198 #define QEDE_QUEUE_CNT(edev)	((edev)->num_queues)
199 #define QEDE_RSS_COUNT(edev)	((edev)->num_queues - (edev)->fp_num_tx)
200 #define QEDE_RX_QUEUE_IDX(edev, i)	(i)
201 #define QEDE_TSS_COUNT(edev)	((edev)->num_queues - (edev)->fp_num_rx)
202 
203 	struct qed_int_info		int_info;
204 
205 	/* Smaller private variant of the RTNL lock */
206 	struct mutex			qede_lock;
207 	u32				state; /* Protected by qede_lock */
208 	u16				rx_buf_size;
209 	u32				rx_copybreak;
210 
211 	/* L2 header size + 2*VLANs (8 bytes) + LLC SNAP (8 bytes) */
212 #define ETH_OVERHEAD			(ETH_HLEN + 8 + 8)
213 	/* Max supported alignment is 256 (shift of 8);
214 	 * a minimal alignment shift of 6 is optimal for 57xxx HW performance.
	 * The macro therefore clamps L1_CACHE_SHIFT into the range [6, 8].
215 	 */
216 #define QEDE_RX_ALIGN_SHIFT		max(6, min(8, L1_CACHE_SHIFT))
217 	/* We assume build_skb() uses sizeof(struct skb_shared_info) bytes
218 	 * at the end of skb->data, to avoid wasting a full cache line.
219 	 * This reduces memory use (skb->truesize).
	 * The value is the larger of (1 << QEDE_RX_ALIGN_SHIFT) and the
	 * SKB_DATA_ALIGN()-ed size of struct skb_shared_info.
220 	 */
221 #define QEDE_FW_RX_ALIGN_END					\
222 	max_t(u64, 1UL << QEDE_RX_ALIGN_SHIFT,			\
223 	      SKB_DATA_ALIGN(sizeof(struct skb_shared_info)))
224 
225 	struct qede_stats		stats;
226 #define QEDE_RSS_INDIR_INITED	BIT(0)
227 #define QEDE_RSS_KEY_INITED	BIT(1)
228 #define QEDE_RSS_CAPS_INITED	BIT(2)
229 	u32 rss_params_inited; /* bit-field to track initialized rss params */
230 	u16 rss_ind_table[128];
231 	u32 rss_key[10];
232 	u8 rss_caps;
233 
234 	u16			q_num_rx_buffers; /* Must be a power of two */
235 	u16			q_num_tx_buffers; /* Must be a power of two */
236 
237 	bool gro_disable;
238 	struct list_head vlan_list;
239 	u16 configured_vlans;
240 	u16 non_configured_vlans;
241 	bool accept_any_vlan;
242 	struct delayed_work		sp_task;
243 	unsigned long			sp_flags;
244 	u16				vxlan_dst_port;
245 	u16				geneve_dst_port;
246 
247 	struct qede_arfs		*arfs;
248 	bool				wol_enabled;
249 
250 	struct qede_rdma_dev		rdma_info;
251 
252 	struct bpf_prog *xdp_prog;
253 };
254 
/* Device open/closed state.
 * NOTE(review): presumably the values stored in qede_dev::state - confirm.
 */
255 enum QEDE_STATE {
256 	QEDE_STATE_CLOSED,
257 	QEDE_STATE_OPEN,
258 };
259 
/* Builds a 64-bit value from two halves: `hi` is widened to u64 and shifted
 * left by 32 before `lo` is added.
 */
260 #define HILO_U64(hi, lo)		((((u64)(hi)) << 32) + (lo))
261 
/* NOTE(review): presumably the number of traffic classes and of
 * priorities the driver handles - confirm against users.
 */
262 #define	MAX_NUM_TC	8
263 #define	MAX_NUM_PRI	8
264 
265 /* The driver supports the new build_skb() API:
266  * RX ring buffer contains pointer to kmalloc() data only,
267  * skb are built only after the frame was DMA-ed.
268  */
/* NOTE(review): the comment above mentions kmalloc() data, but `data` below
 * is a struct page pointer; the comment may be stale - confirm.
 *
 * One software RX buffer descriptor: the backing page, its DMA mapping and
 * an offset into the page.
 */
269 struct sw_rx_data {
270 	struct page *data;
271 	dma_addr_t mapping;
272 	unsigned int page_offset;
273 };
274 
/* State of one aggregation.
 * NOTE(review): presumably the values stored in qede_agg_info::state -
 * confirm.
 */
275 enum qede_agg_state {
276 	QEDE_AGG_STATE_NONE  = 0,
277 	QEDE_AGG_STATE_START = 1,
278 	QEDE_AGG_STATE_ERROR = 2
279 };
280 
/* Bookkeeping for a single aggregation; struct qede_rx_queue keeps an array
 * of these (`tpa_info`), one per possible aggregation.
 */
281 struct qede_agg_info {
282 	/* rx_buf is a data buffer that can be placed / consumed from rx bd
283 	 * chain. It has two purposes: We will preallocate the data buffer
284 	 * for each aggregation when we open the interface and will place this
285 	 * buffer on the rx-bd-ring when we receive TPA_START. We don't want
286 	 * to be in a state where allocation fails, as we can't reuse the
287 	 * consumer buffer in the rx-chain since FW may still be writing to it
288 	 * (since header needs to be modified for TPA).
289 	 * The second purpose is to keep a pointer to the bd buffer during
290 	 * aggregation.
291 	 */
292 	struct sw_rx_data buffer;
293 	struct sk_buff *skb;
294 
295 	/* We need some structs from the start cookie until termination */
296 	u16 vlan_tag;
297 
298 	bool tpa_start_fail;
	/* NOTE(review): presumably an enum qede_agg_state value - confirm. */
299 	u8 state;
300 	u8 frag_id;
301 
302 	u8 tunnel_type;
303 };
304 
/* State of one RX queue: hardware consumer/producer locations, software
 * ring indices, buffer sizing, the BD and completion chains, per-aggregation
 * info, error/packet counters and the XDP RX-queue info.
 */
305 struct qede_rx_queue {
306 	__le16 *hw_cons_ptr;
307 	void __iomem *hw_rxq_prod_addr;
308 
309 	/* Required for the allocation of replacement buffers */
310 	struct device *dev;
311 
312 	struct bpf_prog *xdp_prog;
313 
314 	u16 sw_rx_cons;
315 	u16 sw_rx_prod;
316 
317 	u16 filled_buffers;
318 	u8 data_direction;
319 	u8 rxq_id;
320 
321 	/* Used once per each NAPI run */
322 	u16 num_rx_buffers;
323 
324 	u16 rx_headroom;
325 
326 	u32 rx_buf_size;
327 	u32 rx_buf_seg_size;
328 
329 	struct sw_rx_data *sw_rx_ring;
330 	struct qed_chain rx_bd_ring;
	/* Completion ring; aligned to a cache line by the attribute below. */
331 	struct qed_chain rx_comp_ring ____cacheline_aligned;
332 
333 	/* GRO */
334 	struct qede_agg_info tpa_info[ETH_TPA_MAX_AGGS_NUM];
335 
336 	/* Used once per each NAPI run */
337 	u64 rcv_pkts;
338 
339 	u64 rx_hw_errors;
340 	u64 rx_alloc_errors;
341 	u64 rx_ip_frags;
342 
343 	u64 xdp_no_pass;
344 
345 	void *handle;
346 	struct xdp_rxq_info xdp_rxq;
347 };
348 
/* Two views of the same storage: structured (struct eth_db_data) or as a
 * single raw u32.
 */
349 union db_prod {
350 	struct eth_db_data data;
351 	u32		raw;
352 };
353 
/* Software TX descriptor for the regular (skb) path: the skb pointer plus
 * flags. Used through qede_tx_queue::sw_tx_ring.skbs.
 */
354 struct sw_tx_bd {
355 	struct sk_buff *skb;
356 	u8 flags;
357 /* Set on the first BD descriptor when there is a split BD */
358 #define QEDE_TSO_SPLIT_BD		BIT(0)
359 };
360 
/* Software TX descriptor for the XDP path: the page and its DMA mapping.
 * Used through qede_tx_queue::sw_tx_ring.xdp.
 */
361 struct sw_tx_xdp {
362 	struct page *page;
363 	dma_addr_t mapping;
364 };
365 
/* State of one TX queue, used for both regular and XDP transmission
 * (`is_xdp` distinguishes them; `sw_tx_ring` is a union of the two
 * software-ring layouts).
 */
366 struct qede_tx_queue {
367 	u8 is_xdp;
368 	bool is_legacy;
369 	u16 sw_tx_cons;
370 	u16 sw_tx_prod;
371 	u16 num_tx_buffers; /* Slowpath only */
372 
373 	u64 xmit_pkts;
374 	u64 stopped_cnt;
375 
376 	__le16 *hw_cons_ptr;
377 
378 	/* Needed for the mapping of packets */
379 	struct device *dev;
380 
381 	void __iomem *doorbell_addr;
382 	union db_prod tx_db;
383 	int index; /* Slowpath only */
	/* The two macros are inverses of each other: XDP_TO_IDX subtracts
	 * QEDE_MAX_TSS_CNT(edev) from txq->index, IDX_TO_XDP adds it to idx.
	 */
384 #define QEDE_TXQ_XDP_TO_IDX(edev, txq)	((txq)->index - \
385 					 QEDE_MAX_TSS_CNT(edev))
386 #define QEDE_TXQ_IDX_TO_XDP(edev, idx)	((idx) + QEDE_MAX_TSS_CNT(edev))
387 
388 	/* Regular Tx requires skb + metadata for release purpose,
389 	 * while XDP requires the pages and the mapped address.
390 	 */
391 	union {
392 		struct sw_tx_bd *skbs;
393 		struct sw_tx_xdp *xdp;
394 	} sw_tx_ring;
395 
396 	struct qed_chain tx_pbl;
397 
398 	/* Slowpath; Should be kept in end [unless missing padding] */
399 	void *handle;
400 };
401 
/* Accessors for a buffer descriptor's little-endian address/length fields.
 *
 * BD_UNMAP_ADDR: converts addr.hi and addr.lo to CPU order and combines them
 * into one 64-bit value with HILO_U64().
 * BD_SET_UNMAP_ADDR_LEN: stores the upper/lower 32 bits of `maddr` and the
 * 16-bit `len` into the descriptor in little-endian order. `bd` and `maddr`
 * are evaluated more than once, so avoid arguments with side effects.
 * BD_UNMAP_LEN: returns nbytes converted to CPU order.
 */
402 #define BD_UNMAP_ADDR(bd)		HILO_U64(le32_to_cpu((bd)->addr.hi), \
403 						 le32_to_cpu((bd)->addr.lo))
404 #define BD_SET_UNMAP_ADDR_LEN(bd, maddr, len)				\
405 	do {								\
406 		(bd)->addr.hi = cpu_to_le32(upper_32_bits(maddr));	\
407 		(bd)->addr.lo = cpu_to_le32(lower_32_bits(maddr));	\
408 		(bd)->nbytes = cpu_to_le16(len);			\
409 	} while (0)
410 #define BD_UNMAP_LEN(bd)		(le16_to_cpu((bd)->nbytes))
411 
/* One fastpath context: a NAPI instance together with pointers to its status
 * block info, its RX queue, its TX queue and its XDP TX queue. `type` is a
 * mask of the QEDE_FASTPATH_* bits; QEDE_FASTPATH_COMBINED is TX | RX.
 */
412 struct qede_fastpath {
413 	struct qede_dev	*edev;
414 #define QEDE_FASTPATH_TX	BIT(0)
415 #define QEDE_FASTPATH_RX	BIT(1)
416 #define QEDE_FASTPATH_XDP	BIT(2)
417 #define QEDE_FASTPATH_COMBINED	(QEDE_FASTPATH_TX | QEDE_FASTPATH_RX)
418 	u8			type;
419 	u8			id;
420 	u8			xdp_xmit;
421 	struct napi_struct	napi;
422 	struct qed_sb_info	*sb_info;
423 	struct qede_rx_queue	*rxq;
424 	struct qede_tx_queue	*txq;
425 	struct qede_tx_queue	*xdp_tx;
426 
	/* Size of net_device::name plus 8 extra bytes. */
427 #define VEC_NAME_SIZE	(sizeof(((struct net_device *)0)->name) + 8)
428 	char	name[VEC_NAME_SIZE];
429 };
430 
431 /* Debug print definitions */
/* Name of the net_device attached to edev; dereferences edev->ndev. */
432 #define DP_NAME(edev) ((edev)->ndev->name)
433 
/* Transmit type: XMIT_PLAIN is 0, the others are individual bit flags. */
434 #define XMIT_PLAIN		0
435 #define XMIT_L4_CSUM		BIT(0)
436 #define XMIT_LSO		BIT(1)
437 #define XMIT_ENC		BIT(2)
438 #define XMIT_ENC_GSO_L4_CSUM	BIT(3)
439 
/* Checksum status bit flags. */
440 #define QEDE_CSUM_ERROR			BIT(0)
441 #define QEDE_CSUM_UNNECESSARY		BIT(1)
442 #define QEDE_TUNN_CSUM_UNNECESSARY	BIT(2)
443 
/* NOTE(review): presumably a bit number within qede_dev::sp_flags (it is a
 * plain integer, not a BIT() mask) - confirm.
 */
444 #define QEDE_SP_RX_MODE			1
445 
/* aRFS and classification-rule interface. Only qede_rx_flow_steer() and the
 * two QEDE_SP_* macros depend on CONFIG_RFS_ACCEL; the remaining prototypes
 * are declared unconditionally.
 */
446 #ifdef CONFIG_RFS_ACCEL
447 int qede_rx_flow_steer(struct net_device *dev, const struct sk_buff *skb,
448 		       u16 rxq_index, u32 flow_id);
/* NOTE(review): presumably a bit number within qede_dev::sp_flags - confirm.
 * QEDE_SP_TASK_POLL_DELAY is 5 * HZ, i.e. five seconds expressed in jiffies.
 */
449 #define QEDE_SP_ARFS_CONFIG	4
450 #define QEDE_SP_TASK_POLL_DELAY	(5 * HZ)
451 #endif
452 
453 void qede_process_arfs_filters(struct qede_dev *edev, bool free_fltr);
454 void qede_poll_for_freeing_arfs_filters(struct qede_dev *edev);
455 void qede_arfs_filter_op(void *dev, void *filter, u8 fw_rc);
456 void qede_free_arfs(struct qede_dev *edev);
457 int qede_alloc_arfs(struct qede_dev *edev);
458 int qede_add_cls_rule(struct qede_dev *edev, struct ethtool_rxnfc *info);
459 int qede_del_cls_rule(struct qede_dev *edev, struct ethtool_rxnfc *info);
460 int qede_get_cls_rule_entry(struct qede_dev *edev, struct ethtool_rxnfc *cmd);
461 int qede_get_cls_rule_all(struct qede_dev *edev, struct ethtool_rxnfc *info,
462 			  u32 *rule_locs);
463 int qede_get_arfs_filter_count(struct qede_dev *edev);
464 
/* Arguments passed to qede_reload(): a callback taking the device and this
 * structure, plus a union carrying exactly one of: a feature set, a new BPF
 * program, or an MTU.
 * NOTE(review): which union member is valid presumably depends on which
 * callback is installed in `func` - confirm against the callers.
 */
465 struct qede_reload_args {
466 	void (*func)(struct qede_dev *edev, struct qede_reload_args *args);
467 	union {
468 		netdev_features_t features;
469 		struct bpf_prog *new_prog;
470 		u16 mtu;
471 	} u;
472 };
473 
474 /* Datapath functions definition */
/* Prototypes only; the implementations live outside this header.
 * qede_free_tx_pkt() takes an `int *len` out-parameter, and
 * qede_alloc_rx_buffer() takes an `allow_lazy` flag.
 * NOTE(review): the exact semantics of `len` and `allow_lazy` are not
 * visible from this header - confirm in the implementation.
 */
475 netdev_tx_t qede_start_xmit(struct sk_buff *skb, struct net_device *ndev);
476 netdev_features_t qede_features_check(struct sk_buff *skb,
477 				      struct net_device *dev,
478 				      netdev_features_t features);
479 void qede_tx_log_print(struct qede_dev *edev, struct qede_fastpath *fp);
480 int qede_alloc_rx_buffer(struct qede_rx_queue *rxq, bool allow_lazy);
481 int qede_free_tx_pkt(struct qede_dev *edev,
482 		     struct qede_tx_queue *txq, int *len);
483 int qede_poll(struct napi_struct *napi, int budget);
484 irqreturn_t qede_msix_fp_int(int irq, void *fp_cookie);
485 
486 /* Filtering function definitions */
/* qede_force_mac() and qede_udp_ports_update() take the device as an
 * untyped `void *dev`.
 * NOTE(review): presumably a struct qede_dev pointer handed back by the qed
 * core - confirm in the implementation.
 */
487 void qede_force_mac(void *dev, u8 *mac, bool forced);
488 void qede_udp_ports_update(void *dev, u16 vxlan_port, u16 geneve_port);
489 int qede_set_mac_addr(struct net_device *ndev, void *p);
490 
/* VLAN filter management. */
491 int qede_vlan_rx_add_vid(struct net_device *dev, __be16 proto, u16 vid);
492 int qede_vlan_rx_kill_vid(struct net_device *dev, __be16 proto, u16 vid);
493 void qede_vlan_mark_nonconfigured(struct qede_dev *edev);
494 int qede_configure_vlan_filters(struct qede_dev *edev);
495 
/* Feature flags, RX mode and RSS parameters. */
496 netdev_features_t qede_fix_features(struct net_device *dev,
497 				    netdev_features_t features);
498 int qede_set_features(struct net_device *dev, netdev_features_t features);
499 void qede_set_rx_mode(struct net_device *ndev);
500 void qede_config_rx_mode(struct net_device *ndev);
501 void qede_fill_rss_params(struct qede_dev *edev,
502 			  struct qed_update_vport_rss_params *rss, u8 *update);
503 
/* UDP tunnel port add/remove. */
504 void qede_udp_tunnel_add(struct net_device *dev, struct udp_tunnel_info *ti);
505 void qede_udp_tunnel_del(struct net_device *dev, struct udp_tunnel_info *ti);
506 
/* XDP entry point taking a struct netdev_bpf request. */
507 int qede_xdp(struct net_device *dev, struct netdev_bpf *xdp);
508 
/* Declared only when the kernel is built with CONFIG_DCB. */
509 #ifdef CONFIG_DCB
510 void qede_set_dcbnl_ops(struct net_device *ndev);
511 #endif
512 
/* Miscellaneous driver entry points: debug configuration, ethtool ops
 * registration, reload, MTU change, statistics refresh, the driver lock
 * helpers and queue work/producer helpers.
 * NOTE(review): `is_locked` in qede_reload() presumably tells whether the
 * caller already holds the driver lock - confirm in the implementation.
 * qede_config_debug() writes its results through the two pointer arguments.
 */
513 void qede_config_debug(uint debug, u32 *p_dp_module, u8 *p_dp_level);
514 void qede_set_ethtool_ops(struct net_device *netdev);
515 void qede_reload(struct qede_dev *edev,
516 		 struct qede_reload_args *args, bool is_locked);
517 int qede_change_mtu(struct net_device *dev, int new_mtu);
518 void qede_fill_by_demand_stats(struct qede_dev *edev);
519 void __qede_lock(struct qede_dev *edev);
520 void __qede_unlock(struct qede_dev *edev);
521 bool qede_has_rx_work(struct qede_rx_queue *rxq);
522 int qede_txq_has_work(struct qede_tx_queue *txq);
523 void qede_recycle_rx_bd_ring(struct qede_rx_queue *rxq, u8 count);
524 void qede_update_rx_prod(struct qede_dev *edev, struct qede_rx_queue *rxq);
525 
/* RX ring sizing: the ring size is BIT(13) cast to u16, the maximum number
 * of BDs is one less than the ring size, and the default is BIT(10) - 1.
 */
526 #define RX_RING_SIZE_POW	13
527 #define RX_RING_SIZE		((u16)BIT(RX_RING_SIZE_POW))
528 #define NUM_RX_BDS_MAX		(RX_RING_SIZE - 1)
529 #define NUM_RX_BDS_MIN		128
530 #define NUM_RX_BDS_DEF		((u16)BIT(10) - 1)
531 
/* TX ring sizing: same scheme as RX, except that the default number of BDs
 * equals the maximum.
 */
532 #define TX_RING_SIZE_POW	13
533 #define TX_RING_SIZE		((u16)BIT(TX_RING_SIZE_POW))
534 #define NUM_TX_BDS_MAX		(TX_RING_SIZE - 1)
535 #define NUM_TX_BDS_MIN		128
536 #define NUM_TX_BDS_DEF		NUM_TX_BDS_MAX
537 
538 #define QEDE_MIN_PKT_LEN		64
539 #define QEDE_RX_HDR_SIZE		256
540 #define QEDE_MAX_JUMBO_PACKET_SIZE	9600
/* Iterates i from 0 to edev->num_queues - 1.
 * NOTE(review): relies on a variable named `edev` being in scope at the
 * call site, and `i` is expanded without parentheses, so pass only a plain
 * variable name.
 */
541 #define	for_each_queue(i) for (i = 0; i < edev->num_queues; i++)
542 
543 #endif /* _QEDE_H_ */
544