en_netdev.c revision 273246
1/*
2 * Copyright (c) 2007, 2014 Mellanox Technologies. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses.  You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 *     Redistribution and use in source and binary forms, with or
11 *     without modification, are permitted provided that the following
12 *     conditions are met:
13 *
14 *      - Redistributions of source code must retain the above
15 *        copyright notice, this list of conditions and the following
16 *        disclaimer.
17 *
18 *      - Redistributions in binary form must reproduce the above
19 *        copyright notice, this list of conditions and the following
20 *        disclaimer in the documentation and/or other materials
21 *        provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 *
32 */
33
34#include <linux/etherdevice.h>
35#include <linux/delay.h>
36#include <linux/slab.h>
37#ifdef CONFIG_NET_RX_BUSY_POLL
38#include <net/busy_poll.h>
39#endif
40
41#include <linux/list.h>
42#include <linux/if_ether.h>
43
44#include <linux/mlx4/driver.h>
45#include <linux/mlx4/device.h>
46#include <linux/mlx4/cmd.h>
47#include <linux/mlx4/cq.h>
48
49#include <sys/sockio.h>
50#include <sys/sysctl.h>
51
52#include "mlx4_en.h"
53#include "en_port.h"
54
55static void mlx4_en_sysctl_stat(struct mlx4_en_priv *priv);
56static void mlx4_en_sysctl_conf(struct mlx4_en_priv *priv);
57static int mlx4_en_unit;
58
59#ifdef CONFIG_NET_RX_BUSY_POLL
60/* must be called with local_bh_disable()d */
61static int mlx4_en_low_latency_recv(struct napi_struct *napi)
62{
63	struct mlx4_en_cq *cq = container_of(napi, struct mlx4_en_cq, napi);
64	struct net_device *dev = cq->dev;
65	struct mlx4_en_priv *priv = netdev_priv(dev);
66	struct mlx4_en_rx_ring *rx_ring = priv->rx_ring[cq->ring];
67	int done;
68
69	if (!priv->port_up)
70		return LL_FLUSH_FAILED;
71
72	if (!mlx4_en_cq_lock_poll(cq))
73		return LL_FLUSH_BUSY;
74
75	done = mlx4_en_process_rx_cq(dev, cq, 4);
76#ifdef LL_EXTENDED_STATS
77	if (done)
78		rx_ring->cleaned += done;
79	else
80		rx_ring->misses++;
81#endif
82
83	mlx4_en_cq_unlock_poll(cq);
84
85	return done;
86}
87#endif	/* CONFIG_NET_RX_BUSY_POLL */
88
89#ifdef CONFIG_RFS_ACCEL
90
91struct mlx4_en_filter {
92	struct list_head next;
93	struct work_struct work;
94
95	u8     ip_proto;
96	__be32 src_ip;
97	__be32 dst_ip;
98	__be16 src_port;
99	__be16 dst_port;
100
101	int rxq_index;
102	struct mlx4_en_priv *priv;
103	u32 flow_id;			/* RFS infrastructure id */
104	int id;				/* mlx4_en driver id */
105	u64 reg_id;			/* Flow steering API id */
106	u8 activated;			/* Used to prevent expiry before filter
107					 * is attached
108					 */
109	struct hlist_node filter_chain;
110};
111
112static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv *priv);
113
114static enum mlx4_net_trans_rule_id mlx4_ip_proto_to_trans_rule_id(u8 ip_proto)
115{
116	switch (ip_proto) {
117	case IPPROTO_UDP:
118		return MLX4_NET_TRANS_RULE_ID_UDP;
119	case IPPROTO_TCP:
120		return MLX4_NET_TRANS_RULE_ID_TCP;
121	default:
122		return -EPROTONOSUPPORT;
123	}
124};
125
126static void mlx4_en_filter_work(struct work_struct *work)
127{
128	struct mlx4_en_filter *filter = container_of(work,
129						     struct mlx4_en_filter,
130						     work);
131	struct mlx4_en_priv *priv = filter->priv;
132	struct mlx4_spec_list spec_tcp_udp = {
133		.id = mlx4_ip_proto_to_trans_rule_id(filter->ip_proto),
134		{
135			.tcp_udp = {
136				.dst_port = filter->dst_port,
137				.dst_port_msk = (__force __be16)-1,
138				.src_port = filter->src_port,
139				.src_port_msk = (__force __be16)-1,
140			},
141		},
142	};
143	struct mlx4_spec_list spec_ip = {
144		.id = MLX4_NET_TRANS_RULE_ID_IPV4,
145		{
146			.ipv4 = {
147				.dst_ip = filter->dst_ip,
148				.dst_ip_msk = (__force __be32)-1,
149				.src_ip = filter->src_ip,
150				.src_ip_msk = (__force __be32)-1,
151			},
152		},
153	};
154	struct mlx4_spec_list spec_eth = {
155		.id = MLX4_NET_TRANS_RULE_ID_ETH,
156	};
157	struct mlx4_net_trans_rule rule = {
158		.list = LIST_HEAD_INIT(rule.list),
159		.queue_mode = MLX4_NET_TRANS_Q_LIFO,
160		.exclusive = 1,
161		.allow_loopback = 1,
162		.promisc_mode = MLX4_FS_REGULAR,
163		.port = priv->port,
164		.priority = MLX4_DOMAIN_RFS,
165	};
166	int rc;
167	__be64 mac_mask = cpu_to_be64(MLX4_MAC_MASK << 16);
168
169	if (spec_tcp_udp.id < 0) {
170		en_warn(priv, "RFS: ignoring unsupported ip protocol (%d)\n",
171			filter->ip_proto);
172		goto ignore;
173	}
174	list_add_tail(&spec_eth.list, &rule.list);
175	list_add_tail(&spec_ip.list, &rule.list);
176	list_add_tail(&spec_tcp_udp.list, &rule.list);
177
178	rule.qpn = priv->rss_map.qps[filter->rxq_index].qpn;
179	memcpy(spec_eth.eth.dst_mac, priv->dev->dev_addr, ETH_ALEN);
180	memcpy(spec_eth.eth.dst_mac_msk, &mac_mask, ETH_ALEN);
181
182	filter->activated = 0;
183
184	if (filter->reg_id) {
185		rc = mlx4_flow_detach(priv->mdev->dev, filter->reg_id);
186		if (rc && rc != -ENOENT)
187			en_err(priv, "Error detaching flow. rc = %d\n", rc);
188	}
189
190	rc = mlx4_flow_attach(priv->mdev->dev, &rule, &filter->reg_id);
191	if (rc)
192		en_err(priv, "Error attaching flow. err = %d\n", rc);
193
194ignore:
195	mlx4_en_filter_rfs_expire(priv);
196
197	filter->activated = 1;
198}
199
200static inline struct hlist_head *
201filter_hash_bucket(struct mlx4_en_priv *priv, __be32 src_ip, __be32 dst_ip,
202		   __be16 src_port, __be16 dst_port)
203{
204	unsigned long l;
205	int bucket_idx;
206
207	l = (__force unsigned long)src_port |
208	    ((__force unsigned long)dst_port << 2);
209	l ^= (__force unsigned long)(src_ip ^ dst_ip);
210
211	bucket_idx = hash_long(l, MLX4_EN_FILTER_HASH_SHIFT);
212
213	return &priv->filter_hash[bucket_idx];
214}
215
216static struct mlx4_en_filter *
217mlx4_en_filter_alloc(struct mlx4_en_priv *priv, int rxq_index, __be32 src_ip,
218		     __be32 dst_ip, u8 ip_proto, __be16 src_port,
219		     __be16 dst_port, u32 flow_id)
220{
221	struct mlx4_en_filter *filter = NULL;
222
223	filter = kzalloc(sizeof(struct mlx4_en_filter), GFP_ATOMIC);
224	if (!filter)
225		return NULL;
226
227	filter->priv = priv;
228	filter->rxq_index = rxq_index;
229	INIT_WORK(&filter->work, mlx4_en_filter_work);
230
231	filter->src_ip = src_ip;
232	filter->dst_ip = dst_ip;
233	filter->ip_proto = ip_proto;
234	filter->src_port = src_port;
235	filter->dst_port = dst_port;
236
237	filter->flow_id = flow_id;
238
239	filter->id = priv->last_filter_id++ % RPS_NO_FILTER;
240
241	list_add_tail(&filter->next, &priv->filters);
242	hlist_add_head(&filter->filter_chain,
243		       filter_hash_bucket(priv, src_ip, dst_ip, src_port,
244					  dst_port));
245
246	return filter;
247}
248
249static void mlx4_en_filter_free(struct mlx4_en_filter *filter)
250{
251	struct mlx4_en_priv *priv = filter->priv;
252	int rc;
253
254	list_del(&filter->next);
255
256	rc = mlx4_flow_detach(priv->mdev->dev, filter->reg_id);
257	if (rc && rc != -ENOENT)
258		en_err(priv, "Error detaching flow. rc = %d\n", rc);
259
260	kfree(filter);
261}
262
263static inline struct mlx4_en_filter *
264mlx4_en_filter_find(struct mlx4_en_priv *priv, __be32 src_ip, __be32 dst_ip,
265		    u8 ip_proto, __be16 src_port, __be16 dst_port)
266{
267	struct hlist_node *elem;
268	struct mlx4_en_filter *filter;
269	struct mlx4_en_filter *ret = NULL;
270
271	hlist_for_each_entry(filter, elem,
272			     filter_hash_bucket(priv, src_ip, dst_ip,
273						src_port, dst_port),
274			     filter_chain) {
275		if (filter->src_ip == src_ip &&
276		    filter->dst_ip == dst_ip &&
277		    filter->ip_proto == ip_proto &&
278		    filter->src_port == src_port &&
279		    filter->dst_port == dst_port) {
280			ret = filter;
281			break;
282		}
283	}
284
285	return ret;
286}
287
288static int
289mlx4_en_filter_rfs(struct net_device *net_dev, const struct sk_buff *skb,
290		   u16 rxq_index, u32 flow_id)
291{
292	struct mlx4_en_priv *priv = netdev_priv(net_dev);
293	struct mlx4_en_filter *filter;
294	const struct iphdr *ip;
295	const __be16 *ports;
296	u8 ip_proto;
297	__be32 src_ip;
298	__be32 dst_ip;
299	__be16 src_port;
300	__be16 dst_port;
301	int nhoff = skb_network_offset(skb);
302	int ret = 0;
303
304	if (skb->protocol != htons(ETH_P_IP))
305		return -EPROTONOSUPPORT;
306
307	ip = (const struct iphdr *)(skb->data + nhoff);
308	if (ip_is_fragment(ip))
309		return -EPROTONOSUPPORT;
310
311	if ((ip->protocol != IPPROTO_TCP) && (ip->protocol != IPPROTO_UDP))
312		return -EPROTONOSUPPORT;
313	ports = (const __be16 *)(skb->data + nhoff + 4 * ip->ihl);
314
315	ip_proto = ip->protocol;
316	src_ip = ip->saddr;
317	dst_ip = ip->daddr;
318	src_port = ports[0];
319	dst_port = ports[1];
320
321	spin_lock_bh(&priv->filters_lock);
322	filter = mlx4_en_filter_find(priv, src_ip, dst_ip, ip_proto,
323				     src_port, dst_port);
324	if (filter) {
325		if (filter->rxq_index == rxq_index)
326			goto out;
327
328		filter->rxq_index = rxq_index;
329	} else {
330		filter = mlx4_en_filter_alloc(priv, rxq_index,
331					      src_ip, dst_ip, ip_proto,
332					      src_port, dst_port, flow_id);
333		if (!filter) {
334			ret = -ENOMEM;
335			goto err;
336		}
337	}
338
339	queue_work(priv->mdev->workqueue, &filter->work);
340
341out:
342	ret = filter->id;
343err:
344	spin_unlock_bh(&priv->filters_lock);
345
346	return ret;
347}
348
349void mlx4_en_cleanup_filters(struct mlx4_en_priv *priv,
350			     struct mlx4_en_rx_ring *rx_ring)
351{
352	struct mlx4_en_filter *filter, *tmp;
353	LIST_HEAD(del_list);
354
355	spin_lock_bh(&priv->filters_lock);
356	list_for_each_entry_safe(filter, tmp, &priv->filters, next) {
357		list_move(&filter->next, &del_list);
358		hlist_del(&filter->filter_chain);
359	}
360	spin_unlock_bh(&priv->filters_lock);
361
362	list_for_each_entry_safe(filter, tmp, &del_list, next) {
363		cancel_work_sync(&filter->work);
364		mlx4_en_filter_free(filter);
365	}
366}
367
368static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv *priv)
369{
370	struct mlx4_en_filter *filter = NULL, *tmp, *last_filter = NULL;
371	LIST_HEAD(del_list);
372	int i = 0;
373
374	spin_lock_bh(&priv->filters_lock);
375	list_for_each_entry_safe(filter, tmp, &priv->filters, next) {
376		if (i > MLX4_EN_FILTER_EXPIRY_QUOTA)
377			break;
378
379		if (filter->activated &&
380		    !work_pending(&filter->work) &&
381		    rps_may_expire_flow(priv->dev,
382					filter->rxq_index, filter->flow_id,
383					filter->id)) {
384			list_move(&filter->next, &del_list);
385			hlist_del(&filter->filter_chain);
386		} else
387			last_filter = filter;
388
389		i++;
390	}
391
392	if (last_filter && (&last_filter->next != priv->filters.next))
393		list_move(&priv->filters, &last_filter->next);
394
395	spin_unlock_bh(&priv->filters_lock);
396
397	list_for_each_entry_safe(filter, tmp, &del_list, next)
398		mlx4_en_filter_free(filter);
399}
400#endif
401
402static void mlx4_en_vlan_rx_add_vid(void *arg, struct net_device *dev, u16 vid)
403{
404	struct mlx4_en_priv *priv = netdev_priv(dev);
405	struct mlx4_en_dev *mdev = priv->mdev;
406	int err;
407	int idx;
408
409	if (arg != priv)
410		return;
411
412	en_dbg(HW, priv, "adding VLAN:%d\n", vid);
413
414	set_bit(vid, priv->active_vlans);
415
416	/* Add VID to port VLAN filter */
417	mutex_lock(&mdev->state_lock);
418	if (mdev->device_up && priv->port_up) {
419		err = mlx4_SET_VLAN_FLTR(mdev->dev, priv);
420		if (err)
421			en_err(priv, "Failed configuring VLAN filter\n");
422	}
423	if (mlx4_register_vlan(mdev->dev, priv->port, vid, &idx))
424		en_dbg(HW, priv, "failed adding vlan %d\n", vid);
425	mutex_unlock(&mdev->state_lock);
426
427}
428
429static void mlx4_en_vlan_rx_kill_vid(void *arg, struct net_device *dev, u16 vid)
430{
431	struct mlx4_en_priv *priv = netdev_priv(dev);
432	struct mlx4_en_dev *mdev = priv->mdev;
433	int err;
434
435	if (arg != priv)
436		return;
437
438	en_dbg(HW, priv, "Killing VID:%d\n", vid);
439
440	clear_bit(vid, priv->active_vlans);
441
442	/* Remove VID from port VLAN filter */
443	mutex_lock(&mdev->state_lock);
444	mlx4_unregister_vlan(mdev->dev, priv->port, vid);
445
446	if (mdev->device_up && priv->port_up) {
447		err = mlx4_SET_VLAN_FLTR(mdev->dev, priv);
448		if (err)
449			en_err(priv, "Failed configuring VLAN filter\n");
450	}
451	mutex_unlock(&mdev->state_lock);
452
453}
454
455static int mlx4_en_uc_steer_add(struct mlx4_en_priv *priv,
456				unsigned char *mac, int *qpn, u64 *reg_id)
457{
458	struct mlx4_en_dev *mdev = priv->mdev;
459	struct mlx4_dev *dev = mdev->dev;
460	int err;
461
462	switch (dev->caps.steering_mode) {
463	case MLX4_STEERING_MODE_B0: {
464		struct mlx4_qp qp;
465		u8 gid[16] = {0};
466
467		qp.qpn = *qpn;
468		memcpy(&gid[10], mac, ETH_ALEN);
469		gid[5] = priv->port;
470
471		err = mlx4_unicast_attach(dev, &qp, gid, 0, MLX4_PROT_ETH);
472		break;
473	}
474	case MLX4_STEERING_MODE_DEVICE_MANAGED: {
475		struct mlx4_spec_list spec_eth = { {NULL} };
476		__be64 mac_mask = cpu_to_be64(MLX4_MAC_MASK << 16);
477
478		struct mlx4_net_trans_rule rule = {
479			.queue_mode = MLX4_NET_TRANS_Q_FIFO,
480			.exclusive = 0,
481			.allow_loopback = 1,
482			.promisc_mode = MLX4_FS_REGULAR,
483			.priority = MLX4_DOMAIN_NIC,
484		};
485
486		rule.port = priv->port;
487		rule.qpn = *qpn;
488		INIT_LIST_HEAD(&rule.list);
489
490		spec_eth.id = MLX4_NET_TRANS_RULE_ID_ETH;
491		memcpy(spec_eth.eth.dst_mac, mac, ETH_ALEN);
492		memcpy(spec_eth.eth.dst_mac_msk, &mac_mask, ETH_ALEN);
493		list_add_tail(&spec_eth.list, &rule.list);
494
495		err = mlx4_flow_attach(dev, &rule, reg_id);
496		break;
497	}
498	default:
499		return -EINVAL;
500	}
501	if (err)
502		en_warn(priv, "Failed Attaching Unicast\n");
503
504	return err;
505}
506
507static void mlx4_en_uc_steer_release(struct mlx4_en_priv *priv,
508				     unsigned char *mac, int qpn, u64 reg_id)
509{
510	struct mlx4_en_dev *mdev = priv->mdev;
511	struct mlx4_dev *dev = mdev->dev;
512
513	switch (dev->caps.steering_mode) {
514	case MLX4_STEERING_MODE_B0: {
515		struct mlx4_qp qp;
516		u8 gid[16] = {0};
517
518		qp.qpn = qpn;
519		memcpy(&gid[10], mac, ETH_ALEN);
520		gid[5] = priv->port;
521
522		mlx4_unicast_detach(dev, &qp, gid, MLX4_PROT_ETH);
523		break;
524	}
525	case MLX4_STEERING_MODE_DEVICE_MANAGED: {
526		mlx4_flow_detach(dev, reg_id);
527		break;
528	}
529	default:
530		en_err(priv, "Invalid steering mode.\n");
531	}
532}
533
534static int mlx4_en_get_qp(struct mlx4_en_priv *priv)
535{
536	struct mlx4_en_dev *mdev = priv->mdev;
537	struct mlx4_dev *dev = mdev->dev;
538	struct mlx4_mac_entry *entry;
539	int index = 0;
540	int err = 0;
541	u64 reg_id;
542	int *qpn = &priv->base_qpn;
543	u64 mac = mlx4_mac_to_u64(IF_LLADDR(priv->dev));
544
545	en_dbg(DRV, priv, "Registering MAC: %pM for adding\n",
546	       IF_LLADDR(priv->dev));
547	index = mlx4_register_mac(dev, priv->port, mac);
548	if (index < 0) {
549		err = index;
550		en_err(priv, "Failed adding MAC: %pM\n",
551		       IF_LLADDR(priv->dev));
552		return err;
553	}
554
555	if (dev->caps.steering_mode == MLX4_STEERING_MODE_A0) {
556		int base_qpn = mlx4_get_base_qpn(dev, priv->port);
557		*qpn = base_qpn + index;
558		return 0;
559	}
560
561	err = mlx4_qp_reserve_range(dev, 1, 1, qpn, 0);
562	en_dbg(DRV, priv, "Reserved qp %d\n", *qpn);
563	if (err) {
564		en_err(priv, "Failed to reserve qp for mac registration\n");
565		goto qp_err;
566	}
567
568	err = mlx4_en_uc_steer_add(priv, IF_LLADDR(priv->dev), qpn, &reg_id);
569	if (err)
570		goto steer_err;
571
572	entry = kmalloc(sizeof(*entry), GFP_KERNEL);
573	if (!entry) {
574		err = -ENOMEM;
575		goto alloc_err;
576	}
577	memcpy(entry->mac, IF_LLADDR(priv->dev), sizeof(entry->mac));
578	entry->reg_id = reg_id;
579
580	hlist_add_head(&entry->hlist,
581			   &priv->mac_hash[entry->mac[MLX4_EN_MAC_HASH_IDX]]);
582
583	return 0;
584
585alloc_err:
586	mlx4_en_uc_steer_release(priv, IF_LLADDR(priv->dev), *qpn, reg_id);
587
588steer_err:
589	mlx4_qp_release_range(dev, *qpn, 1);
590
591qp_err:
592	mlx4_unregister_mac(dev, priv->port, mac);
593	return err;
594}
595
596static void mlx4_en_put_qp(struct mlx4_en_priv *priv)
597{
598	struct mlx4_en_dev *mdev = priv->mdev;
599	struct mlx4_dev *dev = mdev->dev;
600	int qpn = priv->base_qpn;
601	u64 mac;
602
603	if (dev->caps.steering_mode == MLX4_STEERING_MODE_A0) {
604		mac = mlx4_mac_to_u64(IF_LLADDR(priv->dev));
605		en_dbg(DRV, priv, "Registering MAC: %pM for deleting\n",
606		       IF_LLADDR(priv->dev));
607		mlx4_unregister_mac(dev, priv->port, mac);
608	} else {
609		struct mlx4_mac_entry *entry;
610		struct hlist_node *n, *tmp;
611		struct hlist_head *bucket;
612		unsigned int i;
613
614		for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) {
615			bucket = &priv->mac_hash[i];
616			hlist_for_each_entry_safe(entry, n, tmp, bucket, hlist) {
617				mac = mlx4_mac_to_u64(entry->mac);
618				en_dbg(DRV, priv, "Registering MAC: %pM for deleting\n",
619				       entry->mac);
620				mlx4_en_uc_steer_release(priv, entry->mac,
621							 qpn, entry->reg_id);
622
623				mlx4_unregister_mac(dev, priv->port, mac);
624				hlist_del(&entry->hlist);
625				kfree(entry);
626			}
627		}
628
629		en_dbg(DRV, priv, "Releasing qp: port %d, qpn %d\n",
630		       priv->port, qpn);
631		mlx4_qp_release_range(dev, qpn, 1);
632		priv->flags &= ~MLX4_EN_FLAG_FORCE_PROMISC;
633	}
634}
635
636static void mlx4_en_clear_list(struct net_device *dev)
637{
638	struct mlx4_en_priv *priv = netdev_priv(dev);
639	struct mlx4_en_mc_list *tmp, *mc_to_del;
640
641	list_for_each_entry_safe(mc_to_del, tmp, &priv->mc_list, list) {
642		list_del(&mc_to_del->list);
643		kfree(mc_to_del);
644	}
645}
646
647static void mlx4_en_cache_mclist(struct net_device *dev)
648{
649        struct ifmultiaddr *ifma;
650	struct mlx4_en_mc_list *tmp;
651	struct mlx4_en_priv *priv = netdev_priv(dev);
652
653        TAILQ_FOREACH(ifma, &dev->if_multiaddrs, ifma_link) {
654                if (ifma->ifma_addr->sa_family != AF_LINK)
655                        continue;
656                if (((struct sockaddr_dl *)ifma->ifma_addr)->sdl_alen !=
657                                ETHER_ADDR_LEN)
658                        continue;
659                /* Make sure the list didn't grow. */
660		tmp = kzalloc(sizeof(struct mlx4_en_mc_list), GFP_ATOMIC);
661		memcpy(tmp->addr,
662			LLADDR((struct sockaddr_dl *)ifma->ifma_addr), ETH_ALEN);
663		list_add_tail(&tmp->list, &priv->mc_list);
664        }
665}
666
667static void update_mclist_flags(struct mlx4_en_priv *priv,
668				struct list_head *dst,
669				struct list_head *src)
670{
671	struct mlx4_en_mc_list *dst_tmp, *src_tmp, *new_mc;
672	bool found;
673
674	/* Find all the entries that should be removed from dst,
675	 * These are the entries that are not found in src
676	 */
677	list_for_each_entry(dst_tmp, dst, list) {
678		found = false;
679		list_for_each_entry(src_tmp, src, list) {
680			if (!memcmp(dst_tmp->addr, src_tmp->addr, ETH_ALEN)) {
681				found = true;
682				break;
683			}
684		}
685		if (!found)
686			dst_tmp->action = MCLIST_REM;
687	}
688
689	/* Add entries that exist in src but not in dst
690	 * mark them as need to add
691	 */
692	list_for_each_entry(src_tmp, src, list) {
693		found = false;
694		list_for_each_entry(dst_tmp, dst, list) {
695			if (!memcmp(dst_tmp->addr, src_tmp->addr, ETH_ALEN)) {
696				dst_tmp->action = MCLIST_NONE;
697				found = true;
698				break;
699			}
700		}
701		if (!found) {
702			new_mc = kmalloc(sizeof(struct mlx4_en_mc_list),
703					 GFP_KERNEL);
704			if (!new_mc) {
705				en_err(priv, "Failed to allocate current multicast list\n");
706				return;
707			}
708			memcpy(new_mc, src_tmp,
709			       sizeof(struct mlx4_en_mc_list));
710			new_mc->action = MCLIST_ADD;
711			list_add_tail(&new_mc->list, dst);
712		}
713	}
714}
715
716static void mlx4_en_set_rx_mode(struct net_device *dev)
717{
718	struct mlx4_en_priv *priv = netdev_priv(dev);
719
720	if (!priv->port_up)
721		return;
722
723	queue_work(priv->mdev->workqueue, &priv->rx_mode_task);
724}
725
726static void mlx4_en_set_promisc_mode(struct mlx4_en_priv *priv,
727				     struct mlx4_en_dev *mdev)
728{
729	int err = 0;
730	if (!(priv->flags & MLX4_EN_FLAG_PROMISC)) {
731		priv->flags |= MLX4_EN_FLAG_PROMISC;
732
733		/* Enable promiscouos mode */
734		switch (mdev->dev->caps.steering_mode) {
735		case MLX4_STEERING_MODE_DEVICE_MANAGED:
736			err = mlx4_flow_steer_promisc_add(mdev->dev,
737							  priv->port,
738							  priv->base_qpn,
739							  MLX4_FS_ALL_DEFAULT);
740			if (err)
741				en_err(priv, "Failed enabling promiscuous mode\n");
742			priv->flags |= MLX4_EN_FLAG_MC_PROMISC;
743			break;
744
745		case MLX4_STEERING_MODE_B0:
746			err = mlx4_unicast_promisc_add(mdev->dev,
747						       priv->base_qpn,
748						       priv->port);
749			if (err)
750				en_err(priv, "Failed enabling unicast promiscuous mode\n");
751
752			/* Add the default qp number as multicast
753			 * promisc
754			 */
755			if (!(priv->flags & MLX4_EN_FLAG_MC_PROMISC)) {
756				err = mlx4_multicast_promisc_add(mdev->dev,
757								 priv->base_qpn,
758								 priv->port);
759				if (err)
760					en_err(priv, "Failed enabling multicast promiscuous mode\n");
761				priv->flags |= MLX4_EN_FLAG_MC_PROMISC;
762			}
763			break;
764
765		case MLX4_STEERING_MODE_A0:
766			err = mlx4_SET_PORT_qpn_calc(mdev->dev,
767						     priv->port,
768						     priv->base_qpn,
769						     1);
770			if (err)
771				en_err(priv, "Failed enabling promiscuous mode\n");
772			break;
773		}
774
775		/* Disable port multicast filter (unconditionally) */
776		err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0,
777					  0, MLX4_MCAST_DISABLE);
778		if (err)
779			en_err(priv, "Failed disabling multicast filter\n");
780	}
781}
782
783static void mlx4_en_clear_promisc_mode(struct mlx4_en_priv *priv,
784				       struct mlx4_en_dev *mdev)
785{
786	int err = 0;
787
788	priv->flags &= ~MLX4_EN_FLAG_PROMISC;
789
790	/* Disable promiscouos mode */
791	switch (mdev->dev->caps.steering_mode) {
792	case MLX4_STEERING_MODE_DEVICE_MANAGED:
793		err = mlx4_flow_steer_promisc_remove(mdev->dev,
794						     priv->port,
795						     MLX4_FS_ALL_DEFAULT);
796		if (err)
797			en_err(priv, "Failed disabling promiscuous mode\n");
798		priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC;
799		break;
800
801	case MLX4_STEERING_MODE_B0:
802		err = mlx4_unicast_promisc_remove(mdev->dev,
803						  priv->base_qpn,
804						  priv->port);
805		if (err)
806			en_err(priv, "Failed disabling unicast promiscuous mode\n");
807		/* Disable Multicast promisc */
808		if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) {
809			err = mlx4_multicast_promisc_remove(mdev->dev,
810							    priv->base_qpn,
811							    priv->port);
812			if (err)
813				en_err(priv, "Failed disabling multicast promiscuous mode\n");
814			priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC;
815		}
816		break;
817
818	case MLX4_STEERING_MODE_A0:
819		err = mlx4_SET_PORT_qpn_calc(mdev->dev,
820					     priv->port,
821					     priv->base_qpn, 0);
822		if (err)
823			en_err(priv, "Failed disabling promiscuous mode\n");
824		break;
825	}
826}
827
828static void mlx4_en_do_multicast(struct mlx4_en_priv *priv,
829				 struct net_device *dev,
830				 struct mlx4_en_dev *mdev)
831{
832	struct mlx4_en_mc_list *mclist, *tmp;
833	u8 mc_list[16] = {0};
834	int err = 0;
835	u64 mcast_addr = 0;
836
837
838	/* Enable/disable the multicast filter according to IFF_ALLMULTI */
839	if (dev->if_flags & IFF_ALLMULTI) {
840		err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0,
841					  0, MLX4_MCAST_DISABLE);
842		if (err)
843			en_err(priv, "Failed disabling multicast filter\n");
844
845		/* Add the default qp number as multicast promisc */
846		if (!(priv->flags & MLX4_EN_FLAG_MC_PROMISC)) {
847			switch (mdev->dev->caps.steering_mode) {
848			case MLX4_STEERING_MODE_DEVICE_MANAGED:
849				err = mlx4_flow_steer_promisc_add(mdev->dev,
850								  priv->port,
851								  priv->base_qpn,
852								  MLX4_FS_MC_DEFAULT);
853				break;
854
855			case MLX4_STEERING_MODE_B0:
856				err = mlx4_multicast_promisc_add(mdev->dev,
857								 priv->base_qpn,
858								 priv->port);
859				break;
860
861			case MLX4_STEERING_MODE_A0:
862				break;
863			}
864			if (err)
865				en_err(priv, "Failed entering multicast promisc mode\n");
866			priv->flags |= MLX4_EN_FLAG_MC_PROMISC;
867		}
868	} else {
869		/* Disable Multicast promisc */
870		if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) {
871			switch (mdev->dev->caps.steering_mode) {
872			case MLX4_STEERING_MODE_DEVICE_MANAGED:
873				err = mlx4_flow_steer_promisc_remove(mdev->dev,
874								     priv->port,
875								     MLX4_FS_MC_DEFAULT);
876				break;
877
878			case MLX4_STEERING_MODE_B0:
879				err = mlx4_multicast_promisc_remove(mdev->dev,
880								    priv->base_qpn,
881								    priv->port);
882				break;
883
884			case MLX4_STEERING_MODE_A0:
885				break;
886			}
887			if (err)
888				en_err(priv, "Failed disabling multicast promiscuous mode\n");
889			priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC;
890		}
891
892		err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0,
893					  0, MLX4_MCAST_DISABLE);
894		if (err)
895			en_err(priv, "Failed disabling multicast filter\n");
896
897		/* Flush mcast filter and init it with broadcast address */
898		mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, ETH_BCAST,
899				    1, MLX4_MCAST_CONFIG);
900
901		/* Update multicast list - we cache all addresses so they won't
902		 * change while HW is updated holding the command semaphor */
903		mlx4_en_cache_mclist(dev);
904		list_for_each_entry(mclist, &priv->mc_list, list) {
905			mcast_addr = mlx4_mac_to_u64(mclist->addr);
906			mlx4_SET_MCAST_FLTR(mdev->dev, priv->port,
907					mcast_addr, 0, MLX4_MCAST_CONFIG);
908		}
909		err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0,
910					  0, MLX4_MCAST_ENABLE);
911		if (err)
912			en_err(priv, "Failed enabling multicast filter\n");
913
914		update_mclist_flags(priv, &priv->curr_list, &priv->mc_list);
915		list_for_each_entry_safe(mclist, tmp, &priv->curr_list, list) {
916			if (mclist->action == MCLIST_REM) {
917				/* detach this address and delete from list */
918				memcpy(&mc_list[10], mclist->addr, ETH_ALEN);
919				mc_list[5] = priv->port;
920				err = mlx4_multicast_detach(mdev->dev,
921							    &priv->rss_map.indir_qp,
922							    mc_list,
923							    MLX4_PROT_ETH,
924							    mclist->reg_id);
925				if (err)
926					en_err(priv, "Fail to detach multicast address\n");
927
928				/* remove from list */
929				list_del(&mclist->list);
930				kfree(mclist);
931			} else if (mclist->action == MCLIST_ADD) {
932				/* attach the address */
933				memcpy(&mc_list[10], mclist->addr, ETH_ALEN);
934				/* needed for B0 steering support */
935				mc_list[5] = priv->port;
936				err = mlx4_multicast_attach(mdev->dev,
937							    &priv->rss_map.indir_qp,
938							    mc_list,
939							    priv->port, 0,
940							    MLX4_PROT_ETH,
941							    &mclist->reg_id);
942				if (err)
943					en_err(priv, "Fail to attach multicast address\n");
944
945			}
946		}
947	}
948}
949
950static void mlx4_en_do_set_rx_mode(struct work_struct *work)
951{
952	struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv,
953						 rx_mode_task);
954	struct mlx4_en_dev *mdev = priv->mdev;
955	struct net_device *dev = priv->dev;
956
957
958	mutex_lock(&mdev->state_lock);
959	if (!mdev->device_up) {
960		en_dbg(HW, priv, "Card is not up, ignoring rx mode change.\n");
961		goto out;
962	}
963	if (!priv->port_up) {
964		en_dbg(HW, priv, "Port is down, ignoring rx mode change.\n");
965		goto out;
966	}
967	if (!mlx4_en_QUERY_PORT(mdev, priv->port)) {
968		if (priv->port_state.link_state) {
969			priv->last_link_state = MLX4_DEV_EVENT_PORT_UP;
970			/* Important note: the following call for if_link_state_change
971			 * is needed for interface up scenario (start port, link state
972			 * change) */
973			if_link_state_change(priv->dev, LINK_STATE_UP);
974			en_dbg(HW, priv, "Link Up\n");
975		}
976	}
977
978	/* Promsicuous mode: disable all filters */
979	if ((dev->if_flags & IFF_PROMISC) ||
980	    (priv->flags & MLX4_EN_FLAG_FORCE_PROMISC)) {
981		mlx4_en_set_promisc_mode(priv, mdev);
982		goto out;
983	}
984
985	/* Not in promiscuous mode */
986	if (priv->flags & MLX4_EN_FLAG_PROMISC)
987		mlx4_en_clear_promisc_mode(priv, mdev);
988
989	mlx4_en_do_multicast(priv, dev, mdev);
990out:
991	mutex_unlock(&mdev->state_lock);
992}
993
994#ifdef CONFIG_NET_POLL_CONTROLLER
995static void mlx4_en_netpoll(struct net_device *dev)
996{
997	struct mlx4_en_priv *priv = netdev_priv(dev);
998	struct mlx4_en_cq *cq;
999	unsigned long flags;
1000	int i;
1001
1002	for (i = 0; i < priv->rx_ring_num; i++) {
1003		cq = priv->rx_cq[i];
1004		spin_lock_irqsave(&cq->lock, flags);
1005		napi_synchronize(&cq->napi);
1006		mlx4_en_process_rx_cq(dev, cq, 0);
1007		spin_unlock_irqrestore(&cq->lock, flags);
1008	}
1009}
1010#endif
1011
1012static void mlx4_en_watchdog_timeout(void *arg)
1013{
1014        struct mlx4_en_priv *priv = arg;
1015        struct mlx4_en_dev *mdev = priv->mdev;
1016
1017        en_dbg(DRV, priv, "Scheduling watchdog\n");
1018        queue_work(mdev->workqueue, &priv->watchdog_task);
1019        if (priv->port_up)
1020                callout_reset(&priv->watchdog_timer, MLX4_EN_WATCHDOG_TIMEOUT,
1021                                mlx4_en_watchdog_timeout, priv);
1022}
1023
1024
1025
1026static void mlx4_en_set_default_moderation(struct mlx4_en_priv *priv)
1027{
1028	struct mlx4_en_cq *cq;
1029	int i;
1030
1031	/* If we haven't received a specific coalescing setting
1032	 * (module param), we set the moderation parameters as follows:
1033	 * - moder_cnt is set to the number of mtu sized packets to
1034	 *   satisfy our coelsing target.
1035	 * - moder_time is set to a fixed value.
1036	 */
1037	priv->rx_frames = MLX4_EN_RX_COAL_TARGET / priv->dev->if_mtu + 1;
1038	priv->rx_usecs = MLX4_EN_RX_COAL_TIME;
1039	priv->tx_frames = MLX4_EN_TX_COAL_PKTS;
1040	priv->tx_usecs = MLX4_EN_TX_COAL_TIME;
1041	en_dbg(INTR, priv, "Default coalesing params for mtu: %u - "
1042	       "rx_frames:%d rx_usecs:%d\n",
1043	       (unsigned)priv->dev->if_mtu, priv->rx_frames, priv->rx_usecs);
1044
1045	/* Setup cq moderation params */
1046	for (i = 0; i < priv->rx_ring_num; i++) {
1047		cq = priv->rx_cq[i];
1048		cq->moder_cnt = priv->rx_frames;
1049		cq->moder_time = priv->rx_usecs;
1050		priv->last_moder_time[i] = MLX4_EN_AUTO_CONF;
1051		priv->last_moder_packets[i] = 0;
1052		priv->last_moder_bytes[i] = 0;
1053	}
1054
1055	for (i = 0; i < priv->tx_ring_num; i++) {
1056		cq = priv->tx_cq[i];
1057		cq->moder_cnt = priv->tx_frames;
1058		cq->moder_time = priv->tx_usecs;
1059	}
1060
1061	/* Reset auto-moderation params */
1062	priv->pkt_rate_low = MLX4_EN_RX_RATE_LOW;
1063	priv->rx_usecs_low = MLX4_EN_RX_COAL_TIME_LOW;
1064	priv->pkt_rate_high = MLX4_EN_RX_RATE_HIGH;
1065	priv->rx_usecs_high = MLX4_EN_RX_COAL_TIME_HIGH;
1066	priv->sample_interval = MLX4_EN_SAMPLE_INTERVAL;
1067	priv->adaptive_rx_coal = 1;
1068	priv->last_moder_jiffies = 0;
1069	priv->last_moder_tx_packets = 0;
1070}
1071
1072static void mlx4_en_auto_moderation(struct mlx4_en_priv *priv)
1073{
1074	unsigned long period = (unsigned long) (jiffies - priv->last_moder_jiffies);
1075	struct mlx4_en_cq *cq;
1076	unsigned long packets;
1077	unsigned long rate;
1078	unsigned long avg_pkt_size;
1079	unsigned long rx_packets;
1080	unsigned long rx_bytes;
1081	unsigned long rx_pkt_diff;
1082	int moder_time;
1083	int ring, err;
1084
1085	if (!priv->adaptive_rx_coal || period < priv->sample_interval * HZ)
1086		return;
1087
1088	for (ring = 0; ring < priv->rx_ring_num; ring++) {
1089                spin_lock(&priv->stats_lock);
1090		rx_packets = priv->rx_ring[ring]->packets;
1091		rx_bytes = priv->rx_ring[ring]->bytes;
1092		spin_unlock(&priv->stats_lock);
1093
1094		rx_pkt_diff = ((unsigned long) (rx_packets -
1095				priv->last_moder_packets[ring]));
1096		packets = rx_pkt_diff;
1097		rate = packets * HZ / period;
1098		avg_pkt_size = packets ? ((unsigned long) (rx_bytes -
1099				priv->last_moder_bytes[ring])) / packets : 0;
1100
1101		/* Apply auto-moderation only when packet rate
1102		 * exceeds a rate that it matters */
1103		if (rate > (MLX4_EN_RX_RATE_THRESH / priv->rx_ring_num) &&
1104		    avg_pkt_size > MLX4_EN_AVG_PKT_SMALL) {
1105			if (rate < priv->pkt_rate_low)
1106				moder_time = priv->rx_usecs_low;
1107			else if (rate > priv->pkt_rate_high)
1108				moder_time = priv->rx_usecs_high;
1109			else
1110				moder_time = (rate - priv->pkt_rate_low) *
1111					(priv->rx_usecs_high - priv->rx_usecs_low) /
1112					(priv->pkt_rate_high - priv->pkt_rate_low) +
1113					priv->rx_usecs_low;
1114		} else {
1115			moder_time = priv->rx_usecs_low;
1116		}
1117
1118		if (moder_time != priv->last_moder_time[ring]) {
1119			priv->last_moder_time[ring] = moder_time;
1120			cq = priv->rx_cq[ring];
1121			cq->moder_time = moder_time;
1122			err = mlx4_en_set_cq_moder(priv, cq);
1123			if (err)
1124				en_err(priv, "Failed modifying moderation for cq:%d\n",
1125				       ring);
1126		}
1127		priv->last_moder_packets[ring] = rx_packets;
1128		priv->last_moder_bytes[ring] = rx_bytes;
1129	}
1130
1131	priv->last_moder_jiffies = jiffies;
1132}
1133
1134static void mlx4_en_do_get_stats(struct work_struct *work)
1135{
1136	struct delayed_work *delay = to_delayed_work(work);
1137	struct mlx4_en_priv *priv = container_of(delay, struct mlx4_en_priv,
1138						 stats_task);
1139	struct mlx4_en_dev *mdev = priv->mdev;
1140	int err;
1141
1142	mutex_lock(&mdev->state_lock);
1143	if (mdev->device_up) {
1144		if (priv->port_up) {
1145                        err = mlx4_en_DUMP_ETH_STATS(mdev, priv->port, 0);
1146			if (err)
1147				en_dbg(HW, priv, "Could not update stats\n");
1148
1149			mlx4_en_auto_moderation(priv);
1150		}
1151
1152		queue_delayed_work(mdev->workqueue, &priv->stats_task, STATS_DELAY);
1153	}
1154	mutex_unlock(&mdev->state_lock);
1155}
1156
1157/* mlx4_en_service_task - Run service task for tasks that needed to be done
1158 * periodically
1159 */
1160static void mlx4_en_service_task(struct work_struct *work)
1161{
1162	struct delayed_work *delay = to_delayed_work(work);
1163	struct mlx4_en_priv *priv = container_of(delay, struct mlx4_en_priv,
1164						 service_task);
1165	struct mlx4_en_dev *mdev = priv->mdev;
1166
1167	mutex_lock(&mdev->state_lock);
1168	if (mdev->device_up) {
1169		queue_delayed_work(mdev->workqueue, &priv->service_task,
1170				   SERVICE_TASK_DELAY);
1171	}
1172	mutex_unlock(&mdev->state_lock);
1173}
1174
1175static void mlx4_en_linkstate(struct work_struct *work)
1176{
1177	struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv,
1178						 linkstate_task);
1179	struct mlx4_en_dev *mdev = priv->mdev;
1180	int linkstate = priv->link_state;
1181
1182	mutex_lock(&mdev->state_lock);
1183	/* If observable port state changed set carrier state and
1184	 * report to system log */
1185	if (priv->last_link_state != linkstate) {
1186		if (linkstate == MLX4_DEV_EVENT_PORT_DOWN) {
1187			en_info(priv, "Link Down\n");
1188			if_link_state_change(priv->dev, LINK_STATE_DOWN);
1189		/* make sure the port is up before notifying the OS.
1190		 * This is tricky since we get here on INIT_PORT and
1191		 * in such case we can't tell the OS the port is up.
1192		 * To solve this there is a call to if_link_state_change
1193		 * in set_rx_mode.
1194		 * */
1195		} else if (priv->port_up && (linkstate == MLX4_DEV_EVENT_PORT_UP)){
1196			en_info(priv, "Link Up\n");
1197			if_link_state_change(priv->dev, LINK_STATE_UP);
1198		}
1199	}
1200	priv->last_link_state = linkstate;
1201	mutex_unlock(&mdev->state_lock);
1202}
1203
1204
1205int mlx4_en_start_port(struct net_device *dev)
1206{
1207	struct mlx4_en_priv *priv = netdev_priv(dev);
1208	struct mlx4_en_dev *mdev = priv->mdev;
1209	struct mlx4_en_cq *cq;
1210	struct mlx4_en_tx_ring *tx_ring;
1211	int rx_index = 0;
1212	int tx_index = 0;
1213	int err = 0;
1214	int i;
1215	int j;
1216	u8 mc_list[16] = {0};
1217
1218
1219	if (priv->port_up) {
1220		en_dbg(DRV, priv, "start port called while port already up\n");
1221		return 0;
1222	}
1223
1224	INIT_LIST_HEAD(&priv->mc_list);
1225	INIT_LIST_HEAD(&priv->curr_list);
1226	INIT_LIST_HEAD(&priv->ethtool_list);
1227
1228	/* Calculate Rx buf size */
1229	dev->if_mtu = min(dev->if_mtu, priv->max_mtu);
1230        mlx4_en_calc_rx_buf(dev);
1231	priv->rx_alloc_size = max_t(int, 2 * roundup_pow_of_two(priv->rx_mb_size),
1232				    PAGE_SIZE);
1233	priv->rx_alloc_order = get_order(priv->rx_alloc_size);
1234	priv->rx_buf_size = roundup_pow_of_two(priv->rx_mb_size);
1235	priv->log_rx_info = ROUNDUP_LOG2(sizeof(struct mlx4_en_rx_buf));
1236	en_dbg(DRV, priv, "Rx buf size:%d\n", priv->rx_mb_size);
1237
1238	/* Configure rx cq's and rings */
1239	err = mlx4_en_activate_rx_rings(priv);
1240	if (err) {
1241		en_err(priv, "Failed to activate RX rings\n");
1242		return err;
1243	}
1244	for (i = 0; i < priv->rx_ring_num; i++) {
1245		cq = priv->rx_cq[i];
1246
1247		mlx4_en_cq_init_lock(cq);
1248		err = mlx4_en_activate_cq(priv, cq, i);
1249		if (err) {
1250			en_err(priv, "Failed activating Rx CQ\n");
1251			goto cq_err;
1252		}
1253		for (j = 0; j < cq->size; j++)
1254			cq->buf[j].owner_sr_opcode = MLX4_CQE_OWNER_MASK;
1255		err = mlx4_en_set_cq_moder(priv, cq);
1256		if (err) {
1257			en_err(priv, "Failed setting cq moderation parameters");
1258			mlx4_en_deactivate_cq(priv, cq);
1259			goto cq_err;
1260		}
1261		mlx4_en_arm_cq(priv, cq);
1262		priv->rx_ring[i]->cqn = cq->mcq.cqn;
1263		++rx_index;
1264	}
1265
1266	/* Set qp number */
1267	en_dbg(DRV, priv, "Getting qp number for port %d\n", priv->port);
1268	err = mlx4_en_get_qp(priv);
1269	if (err) {
1270		en_err(priv, "Failed getting eth qp\n");
1271		goto cq_err;
1272	}
1273	mdev->mac_removed[priv->port] = 0;
1274
1275	/* gets default allocated counter index from func cap */
1276	/* or sink counter index if no resources */
1277	priv->counter_index = mdev->dev->caps.def_counter_index[priv->port - 1];
1278
1279	en_dbg(DRV, priv, "%s: default counter index %d for port %d\n",
1280	       __func__, priv->counter_index, priv->port);
1281
1282	err = mlx4_en_config_rss_steer(priv);
1283	if (err) {
1284		en_err(priv, "Failed configuring rss steering\n");
1285		goto mac_err;
1286	}
1287
1288	err = mlx4_en_create_drop_qp(priv);
1289	if (err)
1290		goto rss_err;
1291
1292	/* Configure tx cq's and rings */
1293	for (i = 0; i < priv->tx_ring_num; i++) {
1294		/* Configure cq */
1295		cq = priv->tx_cq[i];
1296		err = mlx4_en_activate_cq(priv, cq, i);
1297		if (err) {
1298			en_err(priv, "Failed allocating Tx CQ\n");
1299			goto tx_err;
1300		}
1301		err = mlx4_en_set_cq_moder(priv, cq);
1302		if (err) {
1303			en_err(priv, "Failed setting cq moderation parameters");
1304			mlx4_en_deactivate_cq(priv, cq);
1305			goto tx_err;
1306		}
1307		en_dbg(DRV, priv, "Resetting index of collapsed CQ:%d to -1\n", i);
1308		cq->buf->wqe_index = cpu_to_be16(0xffff);
1309
1310		/* Configure ring */
1311		tx_ring = priv->tx_ring[i];
1312
1313		err = mlx4_en_activate_tx_ring(priv, tx_ring, cq->mcq.cqn,
1314					       i / priv->num_tx_rings_p_up);
1315		if (err) {
1316			en_err(priv, "Failed allocating Tx ring\n");
1317			mlx4_en_deactivate_cq(priv, cq);
1318			goto tx_err;
1319		}
1320
1321		/* Arm CQ for TX completions */
1322		mlx4_en_arm_cq(priv, cq);
1323
1324		/* Set initial ownership of all Tx TXBBs to SW (1) */
1325		for (j = 0; j < tx_ring->buf_size; j += STAMP_STRIDE)
1326			*((u32 *) (tx_ring->buf + j)) = 0xffffffff;
1327		++tx_index;
1328	}
1329
1330	/* Configure port */
1331	err = mlx4_SET_PORT_general(mdev->dev, priv->port,
1332				    priv->rx_mb_size,
1333				    priv->prof->tx_pause,
1334				    priv->prof->tx_ppp,
1335				    priv->prof->rx_pause,
1336				    priv->prof->rx_ppp);
1337	if (err) {
1338		en_err(priv, "Failed setting port general configurations for port %d, with error %d\n",
1339		       priv->port, err);
1340		goto tx_err;
1341	}
1342	/* Set default qp number */
1343	err = mlx4_SET_PORT_qpn_calc(mdev->dev, priv->port, priv->base_qpn, 0);
1344	if (err) {
1345		en_err(priv, "Failed setting default qp numbers\n");
1346		goto tx_err;
1347	}
1348
1349	/* Init port */
1350	en_dbg(HW, priv, "Initializing port\n");
1351	err = mlx4_INIT_PORT(mdev->dev, priv->port);
1352	if (err) {
1353		en_err(priv, "Failed Initializing port\n");
1354		goto tx_err;
1355	}
1356
1357	/* Attach rx QP to bradcast address */
1358	memset(&mc_list[10], 0xff, ETH_ALEN);
1359	mc_list[5] = priv->port; /* needed for B0 steering support */
1360	if (mlx4_multicast_attach(mdev->dev, &priv->rss_map.indir_qp, mc_list,
1361				  priv->port, 0, MLX4_PROT_ETH,
1362				  &priv->broadcast_id))
1363		mlx4_warn(mdev, "Failed Attaching Broadcast\n");
1364
1365	/* Must redo promiscuous mode setup. */
1366	priv->flags &= ~(MLX4_EN_FLAG_PROMISC | MLX4_EN_FLAG_MC_PROMISC);
1367
1368	/* Schedule multicast task to populate multicast list */
1369	queue_work(mdev->workqueue, &priv->rx_mode_task);
1370
1371	mlx4_set_stats_bitmap(mdev->dev, priv->stats_bitmap);
1372
1373	priv->port_up = true;
1374
1375        /* Enable the queues. */
1376        dev->if_drv_flags &= ~IFF_DRV_OACTIVE;
1377        dev->if_drv_flags |= IFF_DRV_RUNNING;
1378#ifdef CONFIG_DEBUG_FS
1379	mlx4_en_create_debug_files(priv);
1380#endif
1381        callout_reset(&priv->watchdog_timer, MLX4_EN_WATCHDOG_TIMEOUT,
1382                    mlx4_en_watchdog_timeout, priv);
1383
1384
1385	return 0;
1386
1387tx_err:
1388	while (tx_index--) {
1389		mlx4_en_deactivate_tx_ring(priv, priv->tx_ring[tx_index]);
1390		mlx4_en_deactivate_cq(priv, priv->tx_cq[tx_index]);
1391	}
1392	mlx4_en_destroy_drop_qp(priv);
1393rss_err:
1394	mlx4_en_release_rss_steer(priv);
1395mac_err:
1396	mlx4_en_put_qp(priv);
1397cq_err:
1398	while (rx_index--)
1399		mlx4_en_deactivate_cq(priv, priv->rx_cq[rx_index]);
1400	for (i = 0; i < priv->rx_ring_num; i++)
1401		mlx4_en_deactivate_rx_ring(priv, priv->rx_ring[i]);
1402
1403	return err; /* need to close devices */
1404}
1405
1406
1407void mlx4_en_stop_port(struct net_device *dev)
1408{
1409	struct mlx4_en_priv *priv = netdev_priv(dev);
1410	struct mlx4_en_dev *mdev = priv->mdev;
1411	struct mlx4_en_mc_list *mclist, *tmp;
1412	int i;
1413	u8 mc_list[16] = {0};
1414
1415	if (!priv->port_up) {
1416		en_dbg(DRV, priv, "stop port called while port already down\n");
1417		return;
1418	}
1419
1420#ifdef CONFIG_DEBUG_FS
1421	mlx4_en_delete_debug_files(priv);
1422#endif
1423
1424	/* close port*/
1425	mlx4_CLOSE_PORT(mdev->dev, priv->port);
1426
1427	/* Set port as not active */
1428	priv->port_up = false;
1429	if (priv->counter_index != 0xff) {
1430		mlx4_counter_free(mdev->dev, priv->port, priv->counter_index);
1431		priv->counter_index = 0xff;
1432	}
1433
1434	/* Promsicuous mode */
1435	if (mdev->dev->caps.steering_mode ==
1436	    MLX4_STEERING_MODE_DEVICE_MANAGED) {
1437		priv->flags &= ~(MLX4_EN_FLAG_PROMISC |
1438				 MLX4_EN_FLAG_MC_PROMISC);
1439		mlx4_flow_steer_promisc_remove(mdev->dev,
1440					       priv->port,
1441					       MLX4_FS_ALL_DEFAULT);
1442		mlx4_flow_steer_promisc_remove(mdev->dev,
1443					       priv->port,
1444					       MLX4_FS_MC_DEFAULT);
1445	} else if (priv->flags & MLX4_EN_FLAG_PROMISC) {
1446		priv->flags &= ~MLX4_EN_FLAG_PROMISC;
1447
1448		/* Disable promiscouos mode */
1449		mlx4_unicast_promisc_remove(mdev->dev, priv->base_qpn,
1450					    priv->port);
1451
1452		/* Disable Multicast promisc */
1453		if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) {
1454			mlx4_multicast_promisc_remove(mdev->dev, priv->base_qpn,
1455						      priv->port);
1456			priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC;
1457		}
1458	}
1459
1460	/* Detach All multicasts */
1461	memset(&mc_list[10], 0xff, ETH_ALEN);
1462	mc_list[5] = priv->port; /* needed for B0 steering support */
1463	mlx4_multicast_detach(mdev->dev, &priv->rss_map.indir_qp, mc_list,
1464			      MLX4_PROT_ETH, priv->broadcast_id);
1465	list_for_each_entry(mclist, &priv->curr_list, list) {
1466		memcpy(&mc_list[10], mclist->addr, ETH_ALEN);
1467		mc_list[5] = priv->port;
1468		mlx4_multicast_detach(mdev->dev, &priv->rss_map.indir_qp,
1469				      mc_list, MLX4_PROT_ETH, mclist->reg_id);
1470	}
1471	mlx4_en_clear_list(dev);
1472	list_for_each_entry_safe(mclist, tmp, &priv->curr_list, list) {
1473		list_del(&mclist->list);
1474		kfree(mclist);
1475	}
1476
1477	/* Flush multicast filter */
1478	mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1, MLX4_MCAST_CONFIG);
1479	mlx4_en_destroy_drop_qp(priv);
1480
1481	/* Free TX Rings */
1482	for (i = 0; i < priv->tx_ring_num; i++) {
1483		mlx4_en_deactivate_tx_ring(priv, priv->tx_ring[i]);
1484		mlx4_en_deactivate_cq(priv, priv->tx_cq[i]);
1485	}
1486	msleep(10);
1487
1488	for (i = 0; i < priv->tx_ring_num; i++)
1489		mlx4_en_free_tx_buf(dev, priv->tx_ring[i]);
1490
1491	/* Free RSS qps */
1492	mlx4_en_release_rss_steer(priv);
1493
1494	/* Unregister Mac address for the port */
1495	mlx4_en_put_qp(priv);
1496	mdev->mac_removed[priv->port] = 1;
1497
1498	/* Free RX Rings */
1499	for (i = 0; i < priv->rx_ring_num; i++) {
1500		struct mlx4_en_cq *cq = priv->rx_cq[i];
1501		mlx4_en_deactivate_rx_ring(priv, priv->rx_ring[i]);
1502		mlx4_en_deactivate_cq(priv, cq);
1503	}
1504
1505        callout_stop(&priv->watchdog_timer);
1506
1507        dev->if_drv_flags &= ~(IFF_DRV_RUNNING | IFF_DRV_OACTIVE);
1508}
1509
1510static void mlx4_en_restart(struct work_struct *work)
1511{
1512	struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv,
1513						 watchdog_task);
1514	struct mlx4_en_dev *mdev = priv->mdev;
1515	struct net_device *dev = priv->dev;
1516	struct mlx4_en_tx_ring *ring;
1517	int i;
1518
1519
1520	if (priv->blocked == 0 || priv->port_up == 0)
1521		return;
1522	for (i = 0; i < priv->tx_ring_num; i++) {
1523		ring = priv->tx_ring[i];
1524		if (ring->blocked &&
1525				ring->watchdog_time + MLX4_EN_WATCHDOG_TIMEOUT < ticks)
1526			goto reset;
1527	}
1528	return;
1529
1530reset:
1531	priv->port_stats.tx_timeout++;
1532	en_dbg(DRV, priv, "Watchdog task called for port %d\n", priv->port);
1533
1534	mutex_lock(&mdev->state_lock);
1535	if (priv->port_up) {
1536		mlx4_en_stop_port(dev);
1537                //for (i = 0; i < priv->tx_ring_num; i++)
1538                //        netdev_tx_reset_queue(priv->tx_ring[i]->tx_queue);
1539		if (mlx4_en_start_port(dev))
1540			en_err(priv, "Failed restarting port %d\n", priv->port);
1541	}
1542	mutex_unlock(&mdev->state_lock);
1543}
1544
1545static void mlx4_en_clear_stats(struct net_device *dev)
1546{
1547	struct mlx4_en_priv *priv = netdev_priv(dev);
1548	struct mlx4_en_dev *mdev = priv->mdev;
1549	int i;
1550
1551	if (!mlx4_is_slave(mdev->dev))
1552		if (mlx4_en_DUMP_ETH_STATS(mdev, priv->port, 1))
1553			en_dbg(HW, priv, "Failed dumping statistics\n");
1554
1555	memset(&priv->pstats, 0, sizeof(priv->pstats));
1556	memset(&priv->pkstats, 0, sizeof(priv->pkstats));
1557	memset(&priv->port_stats, 0, sizeof(priv->port_stats));
1558	memset(&priv->vport_stats, 0, sizeof(priv->vport_stats));
1559
1560	for (i = 0; i < priv->tx_ring_num; i++) {
1561		priv->tx_ring[i]->bytes = 0;
1562		priv->tx_ring[i]->packets = 0;
1563		priv->tx_ring[i]->tx_csum = 0;
1564	}
1565	for (i = 0; i < priv->rx_ring_num; i++) {
1566		priv->rx_ring[i]->bytes = 0;
1567		priv->rx_ring[i]->packets = 0;
1568		priv->rx_ring[i]->csum_ok = 0;
1569		priv->rx_ring[i]->csum_none = 0;
1570	}
1571}
1572
1573static void mlx4_en_open(void* arg)
1574{
1575
1576        struct mlx4_en_priv *priv;
1577        struct mlx4_en_dev *mdev;
1578        struct net_device *dev;
1579        int err = 0;
1580
1581        priv = arg;
1582        mdev = priv->mdev;
1583        dev = priv->dev;
1584
1585
1586	mutex_lock(&mdev->state_lock);
1587
1588	if (!mdev->device_up) {
1589		en_err(priv, "Cannot open - device down/disabled\n");
1590		goto out;
1591	}
1592
1593	/* Reset HW statistics and SW counters */
1594	mlx4_en_clear_stats(dev);
1595
1596	err = mlx4_en_start_port(dev);
1597	if (err)
1598		en_err(priv, "Failed starting port:%d\n", priv->port);
1599
1600out:
1601	mutex_unlock(&mdev->state_lock);
1602	return;
1603}
1604
1605void mlx4_en_free_resources(struct mlx4_en_priv *priv)
1606{
1607	int i;
1608
1609#ifdef CONFIG_RFS_ACCEL
1610	if (priv->dev->rx_cpu_rmap) {
1611		free_irq_cpu_rmap(priv->dev->rx_cpu_rmap);
1612		priv->dev->rx_cpu_rmap = NULL;
1613	}
1614#endif
1615
1616	for (i = 0; i < priv->tx_ring_num; i++) {
1617		if (priv->tx_ring && priv->tx_ring[i])
1618			mlx4_en_destroy_tx_ring(priv, &priv->tx_ring[i]);
1619		if (priv->tx_cq && priv->tx_cq[i])
1620			mlx4_en_destroy_cq(priv, &priv->tx_cq[i]);
1621	}
1622
1623	for (i = 0; i < priv->rx_ring_num; i++) {
1624		if (priv->rx_ring[i])
1625			mlx4_en_destroy_rx_ring(priv, &priv->rx_ring[i],
1626				priv->prof->rx_ring_size, priv->stride);
1627		if (priv->rx_cq[i])
1628			mlx4_en_destroy_cq(priv, &priv->rx_cq[i]);
1629	}
1630
1631	if (priv->sysctl)
1632		sysctl_ctx_free(&priv->stat_ctx);
1633
1634
1635}
1636
1637int mlx4_en_alloc_resources(struct mlx4_en_priv *priv)
1638{
1639	struct mlx4_en_port_profile *prof = priv->prof;
1640	int i;
1641	int node = 0;
1642
1643	/* Create rx Rings */
1644	for (i = 0; i < priv->rx_ring_num; i++) {
1645		if (mlx4_en_create_cq(priv, &priv->rx_cq[i],
1646				      prof->rx_ring_size, i, RX, node))
1647			goto err;
1648
1649		if (mlx4_en_create_rx_ring(priv, &priv->rx_ring[i],
1650					   prof->rx_ring_size, node))
1651			goto err;
1652	}
1653
1654	/* Create tx Rings */
1655	for (i = 0; i < priv->tx_ring_num; i++) {
1656		if (mlx4_en_create_cq(priv, &priv->tx_cq[i],
1657				      prof->tx_ring_size, i, TX, node))
1658			goto err;
1659
1660		if (mlx4_en_create_tx_ring(priv, &priv->tx_ring[i],
1661					   prof->tx_ring_size, TXBB_SIZE, node, i))
1662			goto err;
1663	}
1664
1665#ifdef CONFIG_RFS_ACCEL
1666	priv->dev->rx_cpu_rmap = alloc_irq_cpu_rmap(priv->rx_ring_num);
1667	if (!priv->dev->rx_cpu_rmap)
1668		goto err;
1669#endif
1670        /* Re-create stat sysctls in case the number of rings changed. */
1671	mlx4_en_sysctl_stat(priv);
1672	return 0;
1673
1674err:
1675	en_err(priv, "Failed to allocate NIC resources\n");
1676	for (i = 0; i < priv->rx_ring_num; i++) {
1677		if (priv->rx_ring[i])
1678			mlx4_en_destroy_rx_ring(priv, &priv->rx_ring[i],
1679						prof->rx_ring_size,
1680						priv->stride);
1681		if (priv->rx_cq[i])
1682			mlx4_en_destroy_cq(priv, &priv->rx_cq[i]);
1683	}
1684	for (i = 0; i < priv->tx_ring_num; i++) {
1685		if (priv->tx_ring[i])
1686			mlx4_en_destroy_tx_ring(priv, &priv->tx_ring[i]);
1687		if (priv->tx_cq[i])
1688			mlx4_en_destroy_cq(priv, &priv->tx_cq[i]);
1689	}
1690	priv->port_up = false;
1691	return -ENOMEM;
1692}
1693
1694struct en_port_attribute {
1695	struct attribute attr;
1696	ssize_t (*show)(struct en_port *, struct en_port_attribute *, char *buf);
1697	ssize_t (*store)(struct en_port *, struct en_port_attribute *, char *buf, size_t count);
1698};
1699
1700#define PORT_ATTR_RO(_name) \
1701struct en_port_attribute en_port_attr_##_name = __ATTR_RO(_name)
1702
1703#define EN_PORT_ATTR(_name, _mode, _show, _store) \
1704struct en_port_attribute en_port_attr_##_name = __ATTR(_name, _mode, _show, _store)
1705
1706void mlx4_en_destroy_netdev(struct net_device *dev)
1707{
1708	struct mlx4_en_priv *priv = netdev_priv(dev);
1709	struct mlx4_en_dev *mdev = priv->mdev;
1710
1711	en_dbg(DRV, priv, "Destroying netdev on port:%d\n", priv->port);
1712
1713        if (priv->vlan_attach != NULL)
1714                EVENTHANDLER_DEREGISTER(vlan_config, priv->vlan_attach);
1715        if (priv->vlan_detach != NULL)
1716                EVENTHANDLER_DEREGISTER(vlan_unconfig, priv->vlan_detach);
1717
1718	/* Unregister device - this will close the port if it was up */
1719	if (priv->registered)
1720		ether_ifdetach(dev);
1721
1722	if (priv->allocated)
1723		mlx4_free_hwq_res(mdev->dev, &priv->res, MLX4_EN_PAGE_SIZE);
1724
1725	mutex_lock(&mdev->state_lock);
1726	mlx4_en_stop_port(dev);
1727	mutex_unlock(&mdev->state_lock);
1728
1729
1730	cancel_delayed_work(&priv->stats_task);
1731	cancel_delayed_work(&priv->service_task);
1732	/* flush any pending task for this netdev */
1733	flush_workqueue(mdev->workqueue);
1734        callout_drain(&priv->watchdog_timer);
1735
1736	/* Detach the netdev so tasks would not attempt to access it */
1737	mutex_lock(&mdev->state_lock);
1738	mdev->pndev[priv->port] = NULL;
1739	mutex_unlock(&mdev->state_lock);
1740
1741
1742	mlx4_en_free_resources(priv);
1743
1744	/* freeing the sysctl conf cannot be called from within mlx4_en_free_resources */
1745	if (priv->sysctl)
1746		sysctl_ctx_free(&priv->conf_ctx);
1747
1748	kfree(priv->tx_ring);
1749	kfree(priv->tx_cq);
1750
1751        kfree(priv);
1752        if_free(dev);
1753
1754}
1755
1756static int mlx4_en_change_mtu(struct net_device *dev, int new_mtu)
1757{
1758	struct mlx4_en_priv *priv = netdev_priv(dev);
1759	struct mlx4_en_dev *mdev = priv->mdev;
1760	int err = 0;
1761
1762	en_dbg(DRV, priv, "Change MTU called - current:%u new:%u\n",
1763	       (unsigned)dev->if_mtu, (unsigned)new_mtu);
1764
1765	if ((new_mtu < MLX4_EN_MIN_MTU) || (new_mtu > priv->max_mtu)) {
1766		en_err(priv, "Bad MTU size:%d.\n", new_mtu);
1767		return -EPERM;
1768	}
1769	mutex_lock(&mdev->state_lock);
1770	dev->if_mtu = new_mtu;
1771	if (dev->if_drv_flags & IFF_DRV_RUNNING) {
1772		if (!mdev->device_up) {
1773			/* NIC is probably restarting - let watchdog task reset
1774			 *                          * the port */
1775			en_dbg(DRV, priv, "Change MTU called with card down!?\n");
1776		} else {
1777			mlx4_en_stop_port(dev);
1778			err = mlx4_en_start_port(dev);
1779			if (err) {
1780				en_err(priv, "Failed restarting port:%d\n",
1781						priv->port);
1782				queue_work(mdev->workqueue, &priv->watchdog_task);
1783			}
1784		}
1785	}
1786	mutex_unlock(&mdev->state_lock);
1787	return 0;
1788}
1789
1790static int mlx4_en_calc_media(struct mlx4_en_priv *priv)
1791{
1792	int trans_type;
1793	int active;
1794
1795	active = IFM_ETHER;
1796	if (priv->last_link_state == MLX4_DEV_EVENT_PORT_DOWN)
1797		return (active);
1798	/*
1799	 * [ShaharK] mlx4_en_QUERY_PORT sleeps and cannot be called under a
1800	 * non-sleepable lock.
1801	 * I moved it to the periodic mlx4_en_do_get_stats.
1802 	if (mlx4_en_QUERY_PORT(priv->mdev, priv->port))
1803 		return (active);
1804	*/
1805	active |= IFM_FDX;
1806	trans_type = priv->port_state.transciver;
1807	/* XXX I don't know all of the transceiver values. */
1808	switch (priv->port_state.link_speed) {
1809	case 1000:
1810		active |= IFM_1000_T;
1811		break;
1812	case 10000:
1813		if (trans_type > 0 && trans_type <= 0xC)
1814			active |= IFM_10G_SR;
1815		else if (trans_type == 0x80 || trans_type == 0)
1816			active |= IFM_10G_CX4;
1817		break;
1818	case 40000:
1819		active |= IFM_40G_CR4;
1820		break;
1821	}
1822	if (priv->prof->tx_pause)
1823		active |= IFM_ETH_TXPAUSE;
1824	if (priv->prof->rx_pause)
1825		active |= IFM_ETH_RXPAUSE;
1826
1827	return (active);
1828}
1829
1830static void mlx4_en_media_status(struct ifnet *dev, struct ifmediareq *ifmr)
1831{
1832	struct mlx4_en_priv *priv;
1833
1834	priv = dev->if_softc;
1835	ifmr->ifm_status = IFM_AVALID;
1836	if (priv->last_link_state != MLX4_DEV_EVENT_PORT_DOWN)
1837		ifmr->ifm_status |= IFM_ACTIVE;
1838	ifmr->ifm_active = mlx4_en_calc_media(priv);
1839
1840	return;
1841}
1842
1843static int mlx4_en_media_change(struct ifnet *dev)
1844{
1845	struct mlx4_en_priv *priv;
1846        struct ifmedia *ifm;
1847	int rxpause;
1848	int txpause;
1849	int error;
1850
1851	priv = dev->if_softc;
1852	ifm = &priv->media;
1853	rxpause = txpause = 0;
1854	error = 0;
1855
1856	if (IFM_TYPE(ifm->ifm_media) != IFM_ETHER)
1857		return (EINVAL);
1858        switch (IFM_SUBTYPE(ifm->ifm_media)) {
1859        case IFM_AUTO:
1860		break;
1861	case IFM_10G_SR:
1862	case IFM_10G_CX4:
1863	case IFM_1000_T:
1864	case IFM_40G_CR4:
1865		if ((IFM_SUBTYPE(ifm->ifm_media)
1866			== IFM_SUBTYPE(mlx4_en_calc_media(priv)))
1867			&& (ifm->ifm_media & IFM_FDX))
1868			break;
1869		/* Fallthrough */
1870	default:
1871                printf("%s: Only auto media type\n", if_name(dev));
1872                return (EINVAL);
1873	}
1874	/* Allow user to set/clear pause */
1875	if (IFM_OPTIONS(ifm->ifm_media) & IFM_ETH_RXPAUSE)
1876		rxpause = 1;
1877	if (IFM_OPTIONS(ifm->ifm_media) & IFM_ETH_TXPAUSE)
1878		txpause = 1;
1879	if (priv->prof->tx_pause != txpause || priv->prof->rx_pause != rxpause) {
1880		priv->prof->tx_pause = txpause;
1881		priv->prof->rx_pause = rxpause;
1882		error = -mlx4_SET_PORT_general(priv->mdev->dev, priv->port,
1883		     priv->rx_mb_size + ETHER_CRC_LEN, priv->prof->tx_pause,
1884		     priv->prof->tx_ppp, priv->prof->rx_pause,
1885		     priv->prof->rx_ppp);
1886	}
1887	return (error);
1888}
1889
1890static int mlx4_en_ioctl(struct ifnet *dev, u_long command, caddr_t data)
1891{
1892	struct mlx4_en_priv *priv;
1893	struct mlx4_en_dev *mdev;
1894	struct ifreq *ifr;
1895	int error;
1896	int mask;
1897
1898	error = 0;
1899	mask = 0;
1900	priv = dev->if_softc;
1901	mdev = priv->mdev;
1902	ifr = (struct ifreq *) data;
1903	switch (command) {
1904
1905	case SIOCSIFMTU:
1906		error = -mlx4_en_change_mtu(dev, ifr->ifr_mtu);
1907		break;
1908	case SIOCSIFFLAGS:
1909		mutex_lock(&mdev->state_lock);
1910		if (dev->if_flags & IFF_UP) {
1911			if ((dev->if_drv_flags & IFF_DRV_RUNNING) == 0)
1912				mlx4_en_start_port(dev);
1913			else
1914				mlx4_en_set_rx_mode(dev);
1915		} else {
1916			if (dev->if_drv_flags & IFF_DRV_RUNNING) {
1917				mlx4_en_stop_port(dev);
1918                                if_link_state_change(dev, LINK_STATE_DOWN);
1919			}
1920		}
1921		mutex_unlock(&mdev->state_lock);
1922		break;
1923	case SIOCADDMULTI:
1924	case SIOCDELMULTI:
1925		mlx4_en_set_rx_mode(dev);
1926		break;
1927	case SIOCSIFMEDIA:
1928	case SIOCGIFMEDIA:
1929		error = ifmedia_ioctl(dev, ifr, &priv->media, command);
1930		break;
1931	case SIOCSIFCAP:
1932		mutex_lock(&mdev->state_lock);
1933		mask = ifr->ifr_reqcap ^ dev->if_capenable;
1934		if (mask & IFCAP_HWCSUM)
1935			dev->if_capenable ^= IFCAP_HWCSUM;
1936		if (mask & IFCAP_TSO4)
1937			dev->if_capenable ^= IFCAP_TSO4;
1938		if (mask & IFCAP_TSO6)
1939			dev->if_capenable ^= IFCAP_TSO6;
1940		if (mask & IFCAP_LRO)
1941			dev->if_capenable ^= IFCAP_LRO;
1942		if (mask & IFCAP_VLAN_HWTAGGING)
1943			dev->if_capenable ^= IFCAP_VLAN_HWTAGGING;
1944		if (mask & IFCAP_VLAN_HWFILTER)
1945			dev->if_capenable ^= IFCAP_VLAN_HWFILTER;
1946		if (mask & IFCAP_WOL_MAGIC)
1947			dev->if_capenable ^= IFCAP_WOL_MAGIC;
1948		if (dev->if_drv_flags & IFF_DRV_RUNNING)
1949			mlx4_en_start_port(dev);
1950		mutex_unlock(&mdev->state_lock);
1951		VLAN_CAPABILITIES(dev);
1952		break;
1953	default:
1954		error = ether_ioctl(dev, command, data);
1955		break;
1956	}
1957
1958	return (error);
1959}
1960
1961
1962int mlx4_en_init_netdev(struct mlx4_en_dev *mdev, int port,
1963			struct mlx4_en_port_profile *prof)
1964{
1965	struct net_device *dev;
1966	struct mlx4_en_priv *priv;
1967	uint8_t dev_addr[ETHER_ADDR_LEN];
1968	int err;
1969	int i;
1970
1971	priv = kzalloc(sizeof(*priv), GFP_KERNEL);
1972	dev = priv->dev = if_alloc(IFT_ETHER);
1973	if (dev == NULL) {
1974		en_err(priv, "Net device allocation failed\n");
1975		kfree(priv);
1976		return -ENOMEM;
1977	}
1978	dev->if_softc = priv;
1979	if_initname(dev, "mlxen", atomic_fetchadd_int(&mlx4_en_unit, 1));
1980	dev->if_mtu = ETHERMTU;
1981	dev->if_baudrate = 1000000000;
1982	dev->if_init = mlx4_en_open;
1983	dev->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
1984	dev->if_ioctl = mlx4_en_ioctl;
1985	dev->if_transmit = mlx4_en_transmit;
1986	dev->if_qflush = mlx4_en_qflush;
1987	dev->if_snd.ifq_maxlen = prof->tx_ring_size;
1988
1989	/*
1990	 * Initialize driver private data
1991	 */
1992	priv->counter_index = 0xff;
1993	spin_lock_init(&priv->stats_lock);
1994	INIT_WORK(&priv->rx_mode_task, mlx4_en_do_set_rx_mode);
1995	INIT_WORK(&priv->watchdog_task, mlx4_en_restart);
1996	INIT_WORK(&priv->linkstate_task, mlx4_en_linkstate);
1997	INIT_DELAYED_WORK(&priv->stats_task, mlx4_en_do_get_stats);
1998	INIT_DELAYED_WORK(&priv->service_task, mlx4_en_service_task);
1999	callout_init(&priv->watchdog_timer, 1);
2000#ifdef CONFIG_RFS_ACCEL
2001	INIT_LIST_HEAD(&priv->filters);
2002	spin_lock_init(&priv->filters_lock);
2003#endif
2004
2005	priv->msg_enable = MLX4_EN_MSG_LEVEL;
2006	priv->dev = dev;
2007	priv->mdev = mdev;
2008	priv->ddev = &mdev->pdev->dev;
2009	priv->prof = prof;
2010	priv->port = port;
2011	priv->port_up = false;
2012	priv->flags = prof->flags;
2013        priv->ctrl_flags = cpu_to_be32(MLX4_WQE_CTRL_CQ_UPDATE |
2014                        MLX4_WQE_CTRL_SOLICITED);
2015
2016	priv->num_tx_rings_p_up = mdev->profile.num_tx_rings_p_up;
2017	priv->tx_ring_num = prof->tx_ring_num;
2018	priv->tx_ring = kcalloc(MAX_TX_RINGS,
2019				sizeof(struct mlx4_en_tx_ring *), GFP_KERNEL);
2020	if (!priv->tx_ring) {
2021		err = -ENOMEM;
2022		goto out;
2023	}
2024	priv->tx_cq = kcalloc(sizeof(struct mlx4_en_cq *), MAX_TX_RINGS,
2025			GFP_KERNEL);
2026	if (!priv->tx_cq) {
2027		err = -ENOMEM;
2028		goto out;
2029	}
2030
2031	priv->rx_ring_num = prof->rx_ring_num;
2032	priv->cqe_factor = (mdev->dev->caps.cqe_size == 64) ? 1 : 0;
2033	priv->mac_index = -1;
2034	priv->last_ifq_jiffies = 0;
2035	priv->if_counters_rx_errors = 0;
2036	priv->if_counters_rx_no_buffer = 0;
2037#ifdef CONFIG_MLX4_EN_DCB
2038	if (!mlx4_is_slave(priv->mdev->dev)) {
2039		priv->dcbx_cap = DCB_CAP_DCBX_HOST;
2040		priv->flags |= MLX4_EN_FLAG_DCB_ENABLED;
2041		if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_ETS_CFG) {
2042			dev->dcbnl_ops = &mlx4_en_dcbnl_ops;
2043		} else {
2044			en_info(priv, "QoS disabled - no HW support\n");
2045			dev->dcbnl_ops = &mlx4_en_dcbnl_pfc_ops;
2046		}
2047	}
2048#endif
2049
2050	for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i)
2051		INIT_HLIST_HEAD(&priv->mac_hash[i]);
2052
2053
2054	/* Query for default mac and max mtu */
2055	priv->max_mtu = mdev->dev->caps.eth_mtu_cap[priv->port];
2056        priv->mac = mdev->dev->caps.def_mac[priv->port];
2057        if (ILLEGAL_MAC(priv->mac)) {
2058#if BITS_PER_LONG == 64
2059                en_err(priv, "Port: %d, invalid mac burned: 0x%lx, quiting\n",
2060                                priv->port, priv->mac);
2061#elif BITS_PER_LONG == 32
2062                en_err(priv, "Port: %d, invalid mac burned: 0x%llx, quiting\n",
2063                                priv->port, priv->mac);
2064#endif
2065                err = -EINVAL;
2066                goto out;
2067        }
2068
2069
2070
2071	priv->stride = roundup_pow_of_two(sizeof(struct mlx4_en_rx_desc) +
2072					  DS_SIZE);
2073
2074	mlx4_en_sysctl_conf(priv);
2075
2076	err = mlx4_en_alloc_resources(priv);
2077	if (err)
2078		goto out;
2079
2080	/* Allocate page for receive rings */
2081	err = mlx4_alloc_hwq_res(mdev->dev, &priv->res,
2082				MLX4_EN_PAGE_SIZE, MLX4_EN_PAGE_SIZE);
2083	if (err) {
2084		en_err(priv, "Failed to allocate page for rx qps\n");
2085		goto out;
2086	}
2087	priv->allocated = 1;
2088
2089	/*
2090	 * Set driver features
2091	 */
2092	dev->if_capabilities |= IFCAP_RXCSUM | IFCAP_TXCSUM;
2093	dev->if_capabilities |= IFCAP_VLAN_MTU | IFCAP_VLAN_HWTAGGING;
2094	dev->if_capabilities |= IFCAP_VLAN_HWCSUM | IFCAP_VLAN_HWFILTER;
2095	dev->if_capabilities |= IFCAP_LINKSTATE | IFCAP_JUMBO_MTU;
2096	dev->if_capabilities |= IFCAP_LRO;
2097
2098	if (mdev->LSO_support)
2099		dev->if_capabilities |= IFCAP_TSO4 | IFCAP_TSO6 | IFCAP_VLAN_HWTSO;
2100#if 0
2101	/* set TSO limits so that we don't have to drop TX packets */
2102	dev->if_hw_tsomax = 65536 - (ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN);
2103	dev->if_hw_tsomaxsegcount = 16;
2104	dev->if_hw_tsomaxsegsize = 65536;       /* XXX can do up to 4GByte */
2105#endif
2106	dev->if_capenable = dev->if_capabilities;
2107
2108	dev->if_hwassist = 0;
2109	if (dev->if_capenable & (IFCAP_TSO4 | IFCAP_TSO6))
2110		dev->if_hwassist |= CSUM_TSO;
2111	if (dev->if_capenable & IFCAP_TXCSUM)
2112		dev->if_hwassist |= (CSUM_TCP | CSUM_UDP | CSUM_IP);
2113
2114
2115        /* Register for VLAN events */
2116	priv->vlan_attach = EVENTHANDLER_REGISTER(vlan_config,
2117            mlx4_en_vlan_rx_add_vid, priv, EVENTHANDLER_PRI_FIRST);
2118	priv->vlan_detach = EVENTHANDLER_REGISTER(vlan_unconfig,
2119            mlx4_en_vlan_rx_kill_vid, priv, EVENTHANDLER_PRI_FIRST);
2120
2121	mdev->pndev[priv->port] = dev;
2122
2123	priv->last_link_state = MLX4_DEV_EVENT_PORT_DOWN;
2124        mlx4_en_set_default_moderation(priv);
2125
2126	/* Set default MAC */
2127	for (i = 0; i < ETHER_ADDR_LEN; i++)
2128		dev_addr[ETHER_ADDR_LEN - 1 - i] = (u8) (priv->mac >> (8 * i));
2129
2130
2131	ether_ifattach(dev, dev_addr);
2132	if_link_state_change(dev, LINK_STATE_DOWN);
2133	ifmedia_init(&priv->media, IFM_IMASK | IFM_ETH_FMASK,
2134	    mlx4_en_media_change, mlx4_en_media_status);
2135	ifmedia_add(&priv->media, IFM_ETHER | IFM_FDX | IFM_1000_T, 0, NULL);
2136	ifmedia_add(&priv->media, IFM_ETHER | IFM_FDX | IFM_10G_SR, 0, NULL);
2137	ifmedia_add(&priv->media, IFM_ETHER | IFM_FDX | IFM_10G_CX4, 0, NULL);
2138	ifmedia_add(&priv->media, IFM_ETHER | IFM_FDX | IFM_40G_CR4, 0, NULL);
2139	ifmedia_add(&priv->media, IFM_ETHER | IFM_AUTO, 0, NULL);
2140	ifmedia_set(&priv->media, IFM_ETHER | IFM_AUTO);
2141
2142	en_warn(priv, "Using %d TX rings\n", prof->tx_ring_num);
2143	en_warn(priv, "Using %d RX rings\n", prof->rx_ring_num);
2144
2145	priv->registered = 1;
2146
2147        en_warn(priv, "Using %d TX rings\n", prof->tx_ring_num);
2148        en_warn(priv, "Using %d RX rings\n", prof->rx_ring_num);
2149
2150
2151	priv->rx_mb_size = dev->if_mtu + ETH_HLEN + VLAN_HLEN + ETH_FCS_LEN;
2152	err = mlx4_SET_PORT_general(mdev->dev, priv->port,
2153				    priv->rx_mb_size,
2154				    prof->tx_pause, prof->tx_ppp,
2155				    prof->rx_pause, prof->rx_ppp);
2156	if (err) {
2157		en_err(priv, "Failed setting port general configurations "
2158		       "for port %d, with error %d\n", priv->port, err);
2159		goto out;
2160	}
2161
2162	/* Init port */
2163	en_warn(priv, "Initializing port\n");
2164	err = mlx4_INIT_PORT(mdev->dev, priv->port);
2165	if (err) {
2166		en_err(priv, "Failed Initializing port\n");
2167		goto out;
2168	}
2169
2170	queue_delayed_work(mdev->workqueue, &priv->stats_task, STATS_DELAY);
2171
2172        if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS)
2173                queue_delayed_work(mdev->workqueue, &priv->service_task, SERVICE_TASK_DELAY);
2174
2175
2176
2177	return 0;
2178
2179out:
2180	mlx4_en_destroy_netdev(dev);
2181	return err;
2182}
2183static int mlx4_en_set_ring_size(struct net_device *dev,
2184    int rx_size, int tx_size)
2185{
2186        struct mlx4_en_priv *priv = netdev_priv(dev);
2187        struct mlx4_en_dev *mdev = priv->mdev;
2188        int port_up = 0;
2189        int err = 0;
2190
2191        rx_size = roundup_pow_of_two(rx_size);
2192        rx_size = max_t(u32, rx_size, MLX4_EN_MIN_RX_SIZE);
2193        rx_size = min_t(u32, rx_size, MLX4_EN_MAX_RX_SIZE);
2194        tx_size = roundup_pow_of_two(tx_size);
2195        tx_size = max_t(u32, tx_size, MLX4_EN_MIN_TX_SIZE);
2196        tx_size = min_t(u32, tx_size, MLX4_EN_MAX_TX_SIZE);
2197
2198        if (rx_size == (priv->port_up ?
2199            priv->rx_ring[0]->actual_size : priv->rx_ring[0]->size) &&
2200            tx_size == priv->tx_ring[0]->size)
2201                return 0;
2202        mutex_lock(&mdev->state_lock);
2203        if (priv->port_up) {
2204                port_up = 1;
2205                mlx4_en_stop_port(dev);
2206        }
2207        mlx4_en_free_resources(priv);
2208        priv->prof->tx_ring_size = tx_size;
2209        priv->prof->rx_ring_size = rx_size;
2210        err = mlx4_en_alloc_resources(priv);
2211        if (err) {
2212                en_err(priv, "Failed reallocating port resources\n");
2213                goto out;
2214        }
2215        if (port_up) {
2216                err = mlx4_en_start_port(dev);
2217                if (err)
2218                        en_err(priv, "Failed starting port\n");
2219        }
2220out:
2221        mutex_unlock(&mdev->state_lock);
2222        return err;
2223}
2224static int mlx4_en_set_rx_ring_size(SYSCTL_HANDLER_ARGS)
2225{
2226        struct mlx4_en_priv *priv;
2227        int size;
2228        int error;
2229
2230        priv = arg1;
2231        size = priv->prof->rx_ring_size;
2232        error = sysctl_handle_int(oidp, &size, 0, req);
2233        if (error || !req->newptr)
2234                return (error);
2235        error = -mlx4_en_set_ring_size(priv->dev, size,
2236            priv->prof->tx_ring_size);
2237        return (error);
2238}
2239
2240static int mlx4_en_set_tx_ring_size(SYSCTL_HANDLER_ARGS)
2241{
2242        struct mlx4_en_priv *priv;
2243        int size;
2244        int error;
2245
2246        priv = arg1;
2247        size = priv->prof->tx_ring_size;
2248        error = sysctl_handle_int(oidp, &size, 0, req);
2249        if (error || !req->newptr)
2250                return (error);
2251        error = -mlx4_en_set_ring_size(priv->dev, priv->prof->rx_ring_size,
2252            size);
2253
2254        return (error);
2255}
2256
2257static int mlx4_en_set_tx_ppp(SYSCTL_HANDLER_ARGS)
2258{
2259        struct mlx4_en_priv *priv;
2260        int ppp;
2261        int error;
2262
2263        priv = arg1;
2264        ppp = priv->prof->tx_ppp;
2265        error = sysctl_handle_int(oidp, &ppp, 0, req);
2266        if (error || !req->newptr)
2267                return (error);
2268        if (ppp > 0xff || ppp < 0)
2269                return (-EINVAL);
2270        priv->prof->tx_ppp = ppp;
2271        error = -mlx4_SET_PORT_general(priv->mdev->dev, priv->port,
2272                                       priv->rx_mb_size + ETHER_CRC_LEN,
2273                                       priv->prof->tx_pause,
2274                                       priv->prof->tx_ppp,
2275                                       priv->prof->rx_pause,
2276                                       priv->prof->rx_ppp);
2277
2278        return (error);
2279}
2280
2281static int mlx4_en_set_rx_ppp(SYSCTL_HANDLER_ARGS)
2282{
2283        struct mlx4_en_priv *priv;
2284        struct mlx4_en_dev *mdev;
2285        int ppp;
2286        int error;
2287        int port_up;
2288
2289        port_up = 0;
2290        priv = arg1;
2291        mdev = priv->mdev;
2292        ppp = priv->prof->rx_ppp;
2293        error = sysctl_handle_int(oidp, &ppp, 0, req);
2294        if (error || !req->newptr)
2295                return (error);
2296        if (ppp > 0xff || ppp < 0)
2297                return (-EINVAL);
2298        /* See if we have to change the number of tx queues. */
2299        if (!ppp != !priv->prof->rx_ppp) {
2300                mutex_lock(&mdev->state_lock);
2301                if (priv->port_up) {
2302                        port_up = 1;
2303                        mlx4_en_stop_port(priv->dev);
2304                }
2305                mlx4_en_free_resources(priv);
2306                priv->prof->rx_ppp = ppp;
2307                error = -mlx4_en_alloc_resources(priv);
2308                if (error)
2309                        en_err(priv, "Failed reallocating port resources\n");
2310                if (error == 0 && port_up) {
2311                        error = -mlx4_en_start_port(priv->dev);
2312                        if (error)
2313                                en_err(priv, "Failed starting port\n");
2314                }
2315                mutex_unlock(&mdev->state_lock);
2316                return (error);
2317
2318        }
2319        priv->prof->rx_ppp = ppp;
2320        error = -mlx4_SET_PORT_general(priv->mdev->dev, priv->port,
2321                                       priv->rx_mb_size + ETHER_CRC_LEN,
2322                                       priv->prof->tx_pause,
2323                                       priv->prof->tx_ppp,
2324                                       priv->prof->rx_pause,
2325                                       priv->prof->rx_ppp);
2326
2327        return (error);
2328}
2329
2330static void mlx4_en_sysctl_conf(struct mlx4_en_priv *priv)
2331{
2332        struct net_device *dev;
2333        struct sysctl_ctx_list *ctx;
2334        struct sysctl_oid *node;
2335        struct sysctl_oid_list *node_list;
2336        struct sysctl_oid *coal;
2337        struct sysctl_oid_list *coal_list;
2338	const char *pnameunit;
2339
2340        dev = priv->dev;
2341        ctx = &priv->conf_ctx;
2342	pnameunit = device_get_nameunit(priv->mdev->pdev->dev.bsddev);
2343
2344        sysctl_ctx_init(ctx);
2345        priv->sysctl = SYSCTL_ADD_NODE(ctx, SYSCTL_STATIC_CHILDREN(_hw),
2346            OID_AUTO, dev->if_xname, CTLFLAG_RD, 0, "mlx4 10gig ethernet");
2347        node = SYSCTL_ADD_NODE(ctx, SYSCTL_CHILDREN(priv->sysctl), OID_AUTO,
2348            "conf", CTLFLAG_RD, NULL, "Configuration");
2349        node_list = SYSCTL_CHILDREN(node);
2350
2351        SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "msg_enable",
2352            CTLFLAG_RW, &priv->msg_enable, 0,
2353            "Driver message enable bitfield");
2354        SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "rx_rings",
2355            CTLFLAG_RD, &priv->rx_ring_num, 0,
2356            "Number of receive rings");
2357        SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "tx_rings",
2358            CTLFLAG_RD, &priv->tx_ring_num, 0,
2359            "Number of transmit rings");
2360        SYSCTL_ADD_PROC(ctx, node_list, OID_AUTO, "rx_size",
2361            CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv, 0,
2362            mlx4_en_set_rx_ring_size, "I", "Receive ring size");
2363        SYSCTL_ADD_PROC(ctx, node_list, OID_AUTO, "tx_size",
2364            CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv, 0,
2365            mlx4_en_set_tx_ring_size, "I", "Transmit ring size");
2366        SYSCTL_ADD_PROC(ctx, node_list, OID_AUTO, "tx_ppp",
2367            CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv, 0,
2368            mlx4_en_set_tx_ppp, "I", "TX Per-priority pause");
2369        SYSCTL_ADD_PROC(ctx, node_list, OID_AUTO, "rx_ppp",
2370            CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv, 0,
2371            mlx4_en_set_rx_ppp, "I", "RX Per-priority pause");
2372        SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "port_num",
2373            CTLFLAG_RD, &priv->port, 0,
2374            "Port Number");
2375        SYSCTL_ADD_STRING(ctx, node_list, OID_AUTO, "device_name",
2376	    CTLFLAG_RD, __DECONST(void *, pnameunit), 0,
2377	    "PCI device name");
2378
2379        /* Add coalescer configuration. */
2380        coal = SYSCTL_ADD_NODE(ctx, node_list, OID_AUTO,
2381            "coalesce", CTLFLAG_RD, NULL, "Interrupt coalesce configuration");
2382        coal_list = SYSCTL_CHILDREN(node);
2383        SYSCTL_ADD_UINT(ctx, coal_list, OID_AUTO, "pkt_rate_low",
2384            CTLFLAG_RW, &priv->pkt_rate_low, 0,
2385            "Packets per-second for minimum delay");
2386        SYSCTL_ADD_UINT(ctx, coal_list, OID_AUTO, "rx_usecs_low",
2387            CTLFLAG_RW, &priv->rx_usecs_low, 0,
2388            "Minimum RX delay in micro-seconds");
2389        SYSCTL_ADD_UINT(ctx, coal_list, OID_AUTO, "pkt_rate_high",
2390            CTLFLAG_RW, &priv->pkt_rate_high, 0,
2391            "Packets per-second for maximum delay");
2392        SYSCTL_ADD_UINT(ctx, coal_list, OID_AUTO, "rx_usecs_high",
2393            CTLFLAG_RW, &priv->rx_usecs_high, 0,
2394            "Maximum RX delay in micro-seconds");
2395        SYSCTL_ADD_UINT(ctx, coal_list, OID_AUTO, "sample_interval",
2396            CTLFLAG_RW, &priv->sample_interval, 0,
2397            "adaptive frequency in units of HZ ticks");
2398        SYSCTL_ADD_UINT(ctx, coal_list, OID_AUTO, "adaptive_rx_coal",
2399            CTLFLAG_RW, &priv->adaptive_rx_coal, 0,
2400            "Enable adaptive rx coalescing");
2401}
2402
2403
2404static void mlx4_en_sysctl_stat(struct mlx4_en_priv *priv)
2405{
2406	struct net_device *dev;
2407	struct sysctl_ctx_list *ctx;
2408	struct sysctl_oid *node;
2409	struct sysctl_oid_list *node_list;
2410	struct sysctl_oid *ring_node;
2411	struct sysctl_oid_list *ring_list;
2412	struct mlx4_en_tx_ring *tx_ring;
2413	struct mlx4_en_rx_ring *rx_ring;
2414	char namebuf[128];
2415	int i;
2416
2417	dev = priv->dev;
2418
2419	ctx = &priv->stat_ctx;
2420	sysctl_ctx_init(ctx);
2421	node = SYSCTL_ADD_NODE(ctx, SYSCTL_CHILDREN(priv->sysctl), OID_AUTO,
2422	    "stat", CTLFLAG_RD, NULL, "Statistics");
2423	node_list = SYSCTL_CHILDREN(node);
2424
2425#ifdef MLX4_EN_PERF_STAT
2426	SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "tx_poll", CTLFLAG_RD,
2427	    &priv->pstats.tx_poll, "TX Poll calls");
2428	SYSCTL_ADD_QUAD(ctx, node_list, OID_AUTO, "tx_pktsz_avg", CTLFLAG_RD,
2429	    &priv->pstats.tx_pktsz_avg, "TX average packet size");
2430	SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "inflight_avg", CTLFLAG_RD,
2431	    &priv->pstats.inflight_avg, "TX average packets in-flight");
2432	SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "tx_coal_avg", CTLFLAG_RD,
2433	    &priv->pstats.tx_coal_avg, "TX average coalesced completions");
2434	SYSCTL_ADD_UINT(ctx, node_list, OID_AUTO, "rx_coal_avg", CTLFLAG_RD,
2435	    &priv->pstats.rx_coal_avg, "RX average coalesced completions");
2436#endif
2437
2438	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tso_packets", CTLFLAG_RD,
2439	    &priv->port_stats.tso_packets, "TSO packets sent");
2440	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "queue_stopped", CTLFLAG_RD,
2441	    &priv->port_stats.queue_stopped, "Queue full");
2442	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "wake_queue", CTLFLAG_RD,
2443	    &priv->port_stats.wake_queue, "Queue resumed after full");
2444	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_timeout", CTLFLAG_RD,
2445	    &priv->port_stats.tx_timeout, "Transmit timeouts");
2446	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_alloc_failed", CTLFLAG_RD,
2447	    &priv->port_stats.rx_alloc_failed, "RX failed to allocate mbuf");
2448	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_chksum_good", CTLFLAG_RD,
2449	    &priv->port_stats.rx_chksum_good, "RX checksum offload success");
2450	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_chksum_none", CTLFLAG_RD,
2451	    &priv->port_stats.rx_chksum_none, "RX without checksum offload");
2452	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_chksum_offload",
2453	    CTLFLAG_RD, &priv->port_stats.tx_chksum_offload,
2454	    "TX checksum offloads");
2455
2456	/* Could strdup the names and add in a loop.  This is simpler. */
2457	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_bytes", CTLFLAG_RD,
2458	    &priv->pkstats.rx_bytes, "RX Bytes");
2459	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_packets", CTLFLAG_RD,
2460	    &priv->pkstats.rx_packets, "RX packets");
2461	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_multicast_packets", CTLFLAG_RD,
2462	    &priv->pkstats.rx_multicast_packets, "RX Multicast Packets");
2463	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_broadcast_packets", CTLFLAG_RD,
2464	    &priv->pkstats.rx_broadcast_packets, "RX Broadcast Packets");
2465	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_errors", CTLFLAG_RD,
2466	    &priv->pkstats.rx_errors, "RX Errors");
2467	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_dropped", CTLFLAG_RD,
2468	    &priv->pkstats.rx_dropped, "RX Dropped");
2469	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_length_errors", CTLFLAG_RD,
2470	    &priv->pkstats.rx_length_errors, "RX Length Errors");
2471	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_over_errors", CTLFLAG_RD,
2472	    &priv->pkstats.rx_over_errors, "RX Over Errors");
2473	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_crc_errors", CTLFLAG_RD,
2474	    &priv->pkstats.rx_crc_errors, "RX CRC Errors");
2475	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_jabbers", CTLFLAG_RD,
2476	    &priv->pkstats.rx_jabbers, "RX Jabbers");
2477
2478
2479	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_in_range_length_error", CTLFLAG_RD,
2480	    &priv->pkstats.rx_in_range_length_error, "RX IN_Range Length Error");
2481	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_out_range_length_error",
2482		CTLFLAG_RD, &priv->pkstats.rx_out_range_length_error,
2483		"RX Out Range Length Error");
2484	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_lt_64_bytes_packets", CTLFLAG_RD,
2485	    &priv->pkstats.rx_lt_64_bytes_packets, "RX Lt 64 Bytes Packets");
2486	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_127_bytes_packets", CTLFLAG_RD,
2487	    &priv->pkstats.rx_127_bytes_packets, "RX 127 bytes Packets");
2488	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_255_bytes_packets", CTLFLAG_RD,
2489	    &priv->pkstats.rx_255_bytes_packets, "RX 255 bytes Packets");
2490	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_511_bytes_packets", CTLFLAG_RD,
2491	    &priv->pkstats.rx_511_bytes_packets, "RX 511 bytes Packets");
2492	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_1023_bytes_packets", CTLFLAG_RD,
2493	    &priv->pkstats.rx_1023_bytes_packets, "RX 1023 bytes Packets");
2494	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_1518_bytes_packets", CTLFLAG_RD,
2495	    &priv->pkstats.rx_1518_bytes_packets, "RX 1518 bytes Packets");
2496	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_1522_bytes_packets", CTLFLAG_RD,
2497	    &priv->pkstats.rx_1522_bytes_packets, "RX 1522 bytes Packets");
2498	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_1548_bytes_packets", CTLFLAG_RD,
2499	    &priv->pkstats.rx_1548_bytes_packets, "RX 1548 bytes Packets");
2500	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "rx_gt_1548_bytes_packets", CTLFLAG_RD,
2501	    &priv->pkstats.rx_gt_1548_bytes_packets,
2502	    "RX Greater Then 1548 bytes Packets");
2503
2504struct mlx4_en_pkt_stats {
2505	unsigned long tx_packets;
2506	unsigned long tx_bytes;
2507	unsigned long tx_multicast_packets;
2508	unsigned long tx_broadcast_packets;
2509	unsigned long tx_errors;
2510	unsigned long tx_dropped;
2511	unsigned long tx_lt_64_bytes_packets;
2512	unsigned long tx_127_bytes_packets;
2513	unsigned long tx_255_bytes_packets;
2514	unsigned long tx_511_bytes_packets;
2515	unsigned long tx_1023_bytes_packets;
2516	unsigned long tx_1518_bytes_packets;
2517	unsigned long tx_1522_bytes_packets;
2518	unsigned long tx_1548_bytes_packets;
2519	unsigned long tx_gt_1548_bytes_packets;
2520	unsigned long rx_prio[NUM_PRIORITIES][NUM_PRIORITY_STATS];
2521	unsigned long tx_prio[NUM_PRIORITIES][NUM_PRIORITY_STATS];
2522#define NUM_PKT_STATS		72
2523};
2524
2525
2526	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_packets", CTLFLAG_RD,
2527	    &priv->pkstats.tx_packets, "TX packets");
2528	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_bytes", CTLFLAG_RD,
2529	    &priv->pkstats.tx_packets, "TX Bytes");
2530	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_multicast_packets", CTLFLAG_RD,
2531	    &priv->pkstats.tx_multicast_packets, "TX Multicast Packets");
2532	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_broadcast_packets", CTLFLAG_RD,
2533	    &priv->pkstats.tx_broadcast_packets, "TX Broadcast Packets");
2534	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_errors", CTLFLAG_RD,
2535	    &priv->pkstats.tx_errors, "TX Errors");
2536	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_dropped", CTLFLAG_RD,
2537	    &priv->pkstats.tx_dropped, "TX Dropped");
2538	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_lt_64_bytes_packets", CTLFLAG_RD,
2539	    &priv->pkstats.tx_lt_64_bytes_packets, "TX Less Then 64 Bytes Packets");
2540	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_127_bytes_packets", CTLFLAG_RD,
2541	    &priv->pkstats.tx_127_bytes_packets, "TX 127 Bytes Packets");
2542	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_255_bytes_packets", CTLFLAG_RD,
2543	    &priv->pkstats.tx_255_bytes_packets, "TX 255 Bytes Packets");
2544	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_511_bytes_packets", CTLFLAG_RD,
2545	    &priv->pkstats.tx_511_bytes_packets, "TX 511 Bytes Packets");
2546	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_1023_bytes_packets", CTLFLAG_RD,
2547	    &priv->pkstats.tx_1023_bytes_packets, "TX 1023 Bytes Packets");
2548	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_1518_bytes_packets", CTLFLAG_RD,
2549	    &priv->pkstats.tx_1518_bytes_packets, "TX 1518 Bytes Packets");
2550	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_1522_bytes_packets", CTLFLAG_RD,
2551	    &priv->pkstats.tx_1522_bytes_packets, "TX 1522 Bytes Packets");
2552	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_1548_bytes_packets", CTLFLAG_RD,
2553	    &priv->pkstats.tx_1548_bytes_packets, "TX 1548 Bytes Packets");
2554	SYSCTL_ADD_ULONG(ctx, node_list, OID_AUTO, "tx_gt_1548_bytes_packets", CTLFLAG_RD,
2555	    &priv->pkstats.tx_gt_1548_bytes_packets,
2556	    "TX Greater Then 1548 Bytes Packets");
2557
2558
2559
2560	for (i = 0; i < priv->tx_ring_num; i++) {
2561		tx_ring = priv->tx_ring[i];
2562		snprintf(namebuf, sizeof(namebuf), "tx_ring%d", i);
2563		ring_node = SYSCTL_ADD_NODE(ctx, node_list, OID_AUTO, namebuf,
2564		    CTLFLAG_RD, NULL, "TX Ring");
2565		ring_list = SYSCTL_CHILDREN(ring_node);
2566		SYSCTL_ADD_ULONG(ctx, ring_list, OID_AUTO, "packets",
2567		    CTLFLAG_RD, &tx_ring->packets, "TX packets");
2568		SYSCTL_ADD_ULONG(ctx, ring_list, OID_AUTO, "bytes",
2569		    CTLFLAG_RD, &tx_ring->bytes, "TX bytes");
2570
2571	}
2572	for (i = 0; i < priv->rx_ring_num; i++) {
2573		rx_ring = priv->rx_ring[i];
2574		snprintf(namebuf, sizeof(namebuf), "rx_ring%d", i);
2575		ring_node = SYSCTL_ADD_NODE(ctx, node_list, OID_AUTO, namebuf,
2576		    CTLFLAG_RD, NULL, "RX Ring");
2577		ring_list = SYSCTL_CHILDREN(ring_node);
2578		SYSCTL_ADD_ULONG(ctx, ring_list, OID_AUTO, "packets",
2579		    CTLFLAG_RD, &rx_ring->packets, "RX packets");
2580		SYSCTL_ADD_ULONG(ctx, ring_list, OID_AUTO, "bytes",
2581		    CTLFLAG_RD, &rx_ring->bytes, "RX bytes");
2582		SYSCTL_ADD_ULONG(ctx, ring_list, OID_AUTO, "error",
2583		    CTLFLAG_RD, &rx_ring->errors, "RX soft errors");
2584	}
2585}
2586