1 /*
2 * Copyright (c) 2017, Mellanox Technologies. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 */
32
33 #ifndef __MLX5E_REP_H__
34 #define __MLX5E_REP_H__
35
36 #include <net/ip_tunnels.h>
37 #include <linux/rhashtable.h>
38 #include <linux/mutex.h>
39 #include "eswitch.h"
40 #include "en.h"
41 #include "lib/port_tun.h"
42
43 #ifdef CONFIG_MLX5_ESWITCH
44 extern const struct mlx5e_rx_handlers mlx5e_rx_handlers_rep;
45
46 struct mlx5e_neigh_update_table {
47 struct rhashtable neigh_ht;
48 /* Save the neigh hash entries in a list in addition to the hash table
49 * (neigh_ht). In order to iterate easily over the neigh entries.
50 * Used for stats query.
51 */
52 struct list_head neigh_list;
53 /* protect lookup/remove operations */
54 struct mutex encap_lock;
55 struct notifier_block netevent_nb;
56 struct delayed_work neigh_stats_work;
57 unsigned long min_interval; /* jiffies */
58 };
59
60 struct mlx5_tc_ct_priv;
61 struct mlx5_tc_int_port_priv;
62 struct mlx5e_rep_bond;
63 struct mlx5e_tc_tun_encap;
64 struct mlx5e_post_act;
65 struct mlx5e_flow_meters;
66
67 struct mlx5_rep_uplink_priv {
68 /* indirect block callbacks are invoked on bind/unbind events
69 * on registered higher level devices (e.g. tunnel devices)
70 *
71 * tc_indr_block_cb_priv_list is used to lookup indirect callback
72 * private data
73 *
74 */
75 struct list_head tc_indr_block_priv_list;
76
77 struct mlx5_tun_entropy tun_entropy;
78
79 /* protects unready_flows */
80 struct mutex unready_flows_lock;
81 struct list_head unready_flows;
82 struct work_struct reoffload_flows_work;
83
84 /* maps tun_info to a unique id*/
85 struct mapping_ctx *tunnel_mapping;
86 /* maps tun_enc_opts to a unique id*/
87 struct mapping_ctx *tunnel_enc_opts_mapping;
88
89 struct mlx5e_post_act *post_act;
90 struct mlx5_tc_ct_priv *ct_priv;
91 struct mlx5e_tc_psample *tc_psample;
92
93 /* support eswitch vports bonding */
94 struct mlx5e_rep_bond *bond;
95
96 /* tc tunneling encapsulation private data */
97 struct mlx5e_tc_tun_encap *encap;
98
99 /* OVS internal port support */
100 struct mlx5e_tc_int_port_priv *int_port_priv;
101
102 struct mlx5e_flow_meters *flow_meters;
103
104 /* tc action stats */
105 struct mlx5e_tc_act_stats_handle *action_stats_handle;
106
107 struct work_struct mpesw_work;
108 };
109
110 struct mlx5e_rep_priv {
111 struct mlx5_eswitch_rep *rep;
112 struct mlx5e_neigh_update_table neigh_update;
113 struct net_device *netdev;
114 struct mlx5_flow_table *root_ft;
115 struct mlx5_flow_handle *vport_rx_rule;
116 struct list_head vport_sqs_list;
117 struct mlx5_rep_uplink_priv uplink_priv; /* valid for uplink rep */
118 struct rtnl_link_stats64 prev_vf_vport_stats;
119 struct mlx5_flow_handle *send_to_vport_meta_rule;
120 struct rhashtable tc_ht;
121 struct devlink_health_reporter *rep_vnic_reporter;
122 };
123
124 static inline
mlx5e_rep_to_rep_priv(struct mlx5_eswitch_rep * rep)125 struct mlx5e_rep_priv *mlx5e_rep_to_rep_priv(struct mlx5_eswitch_rep *rep)
126 {
127 return rep->rep_data[REP_ETH].priv;
128 }
129
130 struct mlx5e_neigh {
131 union {
132 __be32 v4;
133 struct in6_addr v6;
134 } dst_ip;
135 int family;
136 };
137
138 struct mlx5e_neigh_hash_entry {
139 struct rhash_head rhash_node;
140 struct mlx5e_neigh m_neigh;
141 struct mlx5e_priv *priv;
142 struct net_device *neigh_dev;
143
144 /* Save the neigh hash entry in a list on the representor in
145 * addition to the hash table. In order to iterate easily over the
146 * neighbour entries. Used for stats query.
147 */
148 struct list_head neigh_list;
149
150 /* protects encap list */
151 spinlock_t encap_list_lock;
152 /* encap list sharing the same neigh */
153 struct list_head encap_list;
154
155 /* neigh hash entry can be deleted only when the refcount is zero.
156 * refcount is needed to avoid neigh hash entry removal by TC, while
157 * it's used by the neigh notification call.
158 */
159 refcount_t refcnt;
160
161 /* Save the last reported time offloaded traffic pass over one of the
162 * neigh hash entry flows. Use it to periodically update the neigh
163 * 'used' value and avoid neigh deleting by the kernel.
164 */
165 unsigned long reported_lastuse;
166
167 struct rcu_head rcu;
168 };
169
170 enum {
171 /* set when the encap entry is successfully offloaded into HW */
172 MLX5_ENCAP_ENTRY_VALID = BIT(0),
173 MLX5_REFORMAT_DECAP = BIT(1),
174 MLX5_ENCAP_ENTRY_NO_ROUTE = BIT(2),
175 };
176
177 struct mlx5e_decap_key {
178 struct ethhdr key;
179 };
180
181 struct mlx5e_decap_entry {
182 struct mlx5e_decap_key key;
183 struct list_head flows;
184 struct hlist_node hlist;
185 refcount_t refcnt;
186 struct completion res_ready;
187 int compl_result;
188 struct mlx5_pkt_reformat *pkt_reformat;
189 struct rcu_head rcu;
190 };
191
192 struct mlx5e_mpls_info {
193 u32 label;
194 u8 tc;
195 u8 bos;
196 u8 ttl;
197 };
198
199 struct mlx5e_encap_entry {
200 /* attached neigh hash entry */
201 struct mlx5e_neigh_hash_entry *nhe;
202 /* neigh hash entry list of encaps sharing the same neigh */
203 struct list_head encap_list;
204 /* a node of the eswitch encap hash table which keeping all the encap
205 * entries
206 */
207 struct hlist_node encap_hlist;
208 struct list_head flows;
209 struct list_head route_list;
210 struct mlx5_pkt_reformat *pkt_reformat;
211 const struct ip_tunnel_info *tun_info;
212 struct mlx5e_mpls_info mpls_info;
213 unsigned char h_dest[ETH_ALEN]; /* destination eth addr */
214
215 struct net_device *out_dev;
216 int route_dev_ifindex;
217 struct mlx5e_tc_tunnel *tunnel;
218 int reformat_type;
219 u8 flags;
220 char *encap_header;
221 int encap_size;
222 refcount_t refcnt;
223 struct completion res_ready;
224 int compl_result;
225 struct rcu_head rcu;
226 };
227
228 struct mlx5e_rep_sq_peer {
229 struct mlx5_flow_handle *rule;
230 void *peer;
231 };
232
233 struct mlx5e_rep_sq {
234 struct mlx5_flow_handle *send_to_vport_rule;
235 struct xarray sq_peer;
236 u32 sqn;
237 struct list_head list;
238 };
239
240 int mlx5e_rep_init(void);
241 void mlx5e_rep_cleanup(void);
242 int mlx5e_rep_bond_init(struct mlx5e_rep_priv *rpriv);
243 void mlx5e_rep_bond_cleanup(struct mlx5e_rep_priv *rpriv);
244 int mlx5e_rep_bond_enslave(struct mlx5_eswitch *esw, struct net_device *netdev,
245 struct net_device *lag_dev);
246 void mlx5e_rep_bond_unslave(struct mlx5_eswitch *esw,
247 const struct net_device *netdev,
248 const struct net_device *lag_dev);
249 int mlx5e_rep_bond_update(struct mlx5e_priv *priv, bool cleanup);
250
251 bool mlx5e_rep_has_offload_stats(const struct net_device *dev, int attr_id);
252 int mlx5e_rep_get_offload_stats(int attr_id, const struct net_device *dev,
253 void *sp);
254
255 bool mlx5e_is_uplink_rep(struct mlx5e_priv *priv);
256 void mlx5e_rep_activate_channels(struct mlx5e_priv *priv);
257 void mlx5e_rep_deactivate_channels(struct mlx5e_priv *priv);
258
259 void mlx5e_rep_queue_neigh_stats_work(struct mlx5e_priv *priv);
260
261 bool mlx5e_eswitch_vf_rep(const struct net_device *netdev);
262 bool mlx5e_eswitch_uplink_rep(const struct net_device *netdev);
mlx5e_eswitch_rep(const struct net_device * netdev)263 static inline bool mlx5e_eswitch_rep(const struct net_device *netdev)
264 {
265 return mlx5e_eswitch_vf_rep(netdev) ||
266 mlx5e_eswitch_uplink_rep(netdev);
267 }
268
269 #else /* CONFIG_MLX5_ESWITCH */
mlx5e_is_uplink_rep(struct mlx5e_priv * priv)270 static inline bool mlx5e_is_uplink_rep(struct mlx5e_priv *priv) { return false; }
mlx5e_rep_activate_channels(struct mlx5e_priv * priv)271 static inline void mlx5e_rep_activate_channels(struct mlx5e_priv *priv) {}
mlx5e_rep_deactivate_channels(struct mlx5e_priv * priv)272 static inline void mlx5e_rep_deactivate_channels(struct mlx5e_priv *priv) {}
mlx5e_rep_init(void)273 static inline int mlx5e_rep_init(void) { return 0; };
mlx5e_rep_cleanup(void)274 static inline void mlx5e_rep_cleanup(void) {};
mlx5e_rep_has_offload_stats(const struct net_device * dev,int attr_id)275 static inline bool mlx5e_rep_has_offload_stats(const struct net_device *dev,
276 int attr_id) { return false; }
mlx5e_rep_get_offload_stats(int attr_id,const struct net_device * dev,void * sp)277 static inline int mlx5e_rep_get_offload_stats(int attr_id,
278 const struct net_device *dev,
279 void *sp) { return -EOPNOTSUPP; }
280 #endif
281
mlx5e_is_vport_rep(struct mlx5e_priv * priv)282 static inline bool mlx5e_is_vport_rep(struct mlx5e_priv *priv)
283 {
284 return (MLX5_ESWITCH_MANAGER(priv->mdev) && priv->ppriv);
285 }
286 #endif /* __MLX5E_REP_H__ */
287