2016-08-04 16:13:09 +01:00
|
|
|
/*
|
|
|
|
|
* Copyright (c) 2016 Cisco and/or its affiliates.
|
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
|
* You may obtain a copy of the License at:
|
|
|
|
|
*
|
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
*
|
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
|
* limitations under the License.
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* lb-plugin implements a MagLev-like load balancer.
|
|
|
|
|
* http://research.google.com/pubs/pub44824.html
|
|
|
|
|
*
|
|
|
|
|
* It hasn't been tested for interoperability with the original MagLev
|
|
|
|
|
* but intends to provide similar functionality.
|
|
|
|
|
* The load-balancer receives traffic destined to VIP (Virtual IP)
|
|
|
|
|
* addresses from one or multiple(ECMP) routers.
|
|
|
|
|
* The load-balancer tunnels the traffic toward many application servers
|
|
|
|
|
* ensuring session stickyness (i.e. that a single sessions is tunneled
|
|
|
|
|
* towards a single application server).
|
|
|
|
|
*
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
#ifndef LB_PLUGIN_LB_LB_H_
|
|
|
|
|
#define LB_PLUGIN_LB_LB_H_
|
|
|
|
|
|
|
|
|
|
#include <lb/util.h>
|
2017-11-13 20:34:06 +08:00
|
|
|
#include <vnet/util/refcount.h>
|
2016-08-04 16:13:09 +01:00
|
|
|
|
|
|
|
|
#include <vnet/vnet.h>
|
|
|
|
|
#include <vnet/ip/ip.h>
|
2016-10-05 09:38:21 +01:00
|
|
|
#include <vnet/dpo/dpo.h>
|
|
|
|
|
#include <vnet/fib/fib_table.h>
|
2018-01-23 19:17:23 +08:00
|
|
|
#include <vppinfra/hash.h>
|
2018-02-06 23:00:22 +08:00
|
|
|
#include <vppinfra/bihash_8_8.h>
|
|
|
|
|
#include <vppinfra/bihash_24_8.h>
|
2016-08-04 16:13:09 +01:00
|
|
|
#include <lb/lbhash.h>
|
|
|
|
|
|
|
|
|
|
#define LB_DEFAULT_PER_CPU_STICKY_BUCKETS 1 << 10
|
|
|
|
|
#define LB_DEFAULT_FLOW_TIMEOUT 40
|
2018-02-06 23:00:22 +08:00
|
|
|
#define LB_MAPPING_BUCKETS 1024
|
|
|
|
|
#define LB_MAPPING_MEMORY_SIZE 64<<20
|
2016-08-04 16:13:09 +01:00
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
#define LB_VIP_PER_PORT_BUCKETS 1024
|
|
|
|
|
#define LB_VIP_PER_PORT_MEMORY_SIZE 64<<20
|
|
|
|
|
|
2016-10-05 09:38:21 +01:00
|
|
|
typedef enum {
|
|
|
|
|
LB_NEXT_DROP,
|
|
|
|
|
LB_N_NEXT,
|
|
|
|
|
} lb_next_t;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
typedef enum {
|
|
|
|
|
LB_NAT4_IN2OUT_NEXT_DROP,
|
|
|
|
|
LB_NAT4_IN2OUT_NEXT_LOOKUP,
|
|
|
|
|
LB_NAT4_IN2OUT_N_NEXT,
|
|
|
|
|
} LB_nat4_in2out_next_t;
|
|
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
LB_NAT6_IN2OUT_NEXT_DROP,
|
|
|
|
|
LB_NAT6_IN2OUT_NEXT_LOOKUP,
|
|
|
|
|
LB_NAT6_IN2OUT_N_NEXT,
|
|
|
|
|
} LB_nat6_in2out_next_t;
|
|
|
|
|
|
|
|
|
|
#define foreach_lb_nat_in2out_error \
|
|
|
|
|
_(UNSUPPORTED_PROTOCOL, "Unsupported protocol") \
|
|
|
|
|
_(IN2OUT_PACKETS, "Good in2out packets processed") \
|
|
|
|
|
_(NO_TRANSLATION, "No translation")
|
|
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
#define _(sym,str) LB_NAT_IN2OUT_ERROR_##sym,
|
|
|
|
|
foreach_lb_nat_in2out_error
|
|
|
|
|
#undef _
|
|
|
|
|
LB_NAT_IN2OUT_N_ERROR,
|
|
|
|
|
} lb_nat_in2out_error_t;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* lb for kube-proxy supports three types of service
|
|
|
|
|
*/
|
|
|
|
|
typedef enum {
|
|
|
|
|
LB_SRV_TYPE_CLUSTERIP,
|
|
|
|
|
LB_SRV_TYPE_NODEPORT,
|
|
|
|
|
LB_SRV_N_TYPES,
|
|
|
|
|
} lb_svr_type_t;
|
|
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
LB4_NODEPORT_NEXT_IP4_NAT4,
|
|
|
|
|
LB4_NODEPORT_NEXT_DROP,
|
|
|
|
|
LB4_NODEPORT_N_NEXT,
|
|
|
|
|
} lb4_nodeport_next_t;
|
|
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
LB6_NODEPORT_NEXT_IP6_NAT6,
|
|
|
|
|
LB6_NODEPORT_NEXT_DROP,
|
|
|
|
|
LB6_NODEPORT_N_NEXT,
|
|
|
|
|
} lb6_nodeport_next_t;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* Each VIP is configured with a set of
|
|
|
|
|
* application server.
|
|
|
|
|
*/
|
|
|
|
|
typedef struct {
|
2016-10-05 09:38:21 +01:00
|
|
|
/**
|
|
|
|
|
* Registration to FIB event.
|
|
|
|
|
*/
|
|
|
|
|
fib_node_t fib_node;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* Destination address used to tunnel traffic towards
|
|
|
|
|
* that application server.
|
|
|
|
|
* The address is also used as ID and pseudo-random
|
|
|
|
|
* seed for the load-balancing process.
|
|
|
|
|
*/
|
|
|
|
|
ip46_address_t address;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* ASs are indexed by address and VIP Index.
|
|
|
|
|
* Which means there will be duplicated if the same server
|
|
|
|
|
* address is used for multiple VIPs.
|
|
|
|
|
*/
|
|
|
|
|
u32 vip_index;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Some per-AS flags.
|
|
|
|
|
* For now only LB_AS_FLAGS_USED is defined.
|
|
|
|
|
*/
|
|
|
|
|
u8 flags;
|
|
|
|
|
|
|
|
|
|
#define LB_AS_FLAGS_USED 0x1
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Rotating timestamp of when LB_AS_FLAGS_USED flag was last set.
|
|
|
|
|
*
|
|
|
|
|
* AS removal is based on garbage collection and reference counting.
|
|
|
|
|
* When an AS is removed, there is a race between configuration core
|
|
|
|
|
* and worker cores which may still add a reference while it should not
|
|
|
|
|
* be used. This timestamp is used to not remove the AS while a race condition
|
|
|
|
|
* may happen.
|
|
|
|
|
*/
|
|
|
|
|
u32 last_used;
|
2016-10-05 09:38:21 +01:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The FIB entry index for the next-hop
|
|
|
|
|
*/
|
|
|
|
|
fib_node_index_t next_hop_fib_entry_index;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The child index on the FIB entry
|
|
|
|
|
*/
|
|
|
|
|
u32 next_hop_child_index;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The next DPO in the graph to follow.
|
|
|
|
|
*/
|
|
|
|
|
dpo_id_t dpo;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
} lb_as_t;
|
|
|
|
|
|
|
|
|
|
format_function_t format_lb_as;
|
|
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
|
u32 as_index;
|
|
|
|
|
} lb_new_flow_entry_t;
|
|
|
|
|
|
|
|
|
|
#define lb_foreach_vip_counter \
|
2016-10-13 13:36:18 +01:00
|
|
|
_(NEXT_PACKET, "packet from existing sessions", 0) \
|
|
|
|
|
_(FIRST_PACKET, "first session packet", 1) \
|
|
|
|
|
_(UNTRACKED_PACKET, "untracked packet", 2) \
|
|
|
|
|
_(NO_SERVER, "no server configured", 3)
|
2016-08-04 16:13:09 +01:00
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
#define _(a,b,c) LB_VIP_COUNTER_##a = c,
|
|
|
|
|
lb_foreach_vip_counter
|
|
|
|
|
#undef _
|
|
|
|
|
LB_N_VIP_COUNTERS
|
|
|
|
|
} lb_vip_counter_t;
|
|
|
|
|
|
2018-01-23 19:17:23 +08:00
|
|
|
typedef enum {
|
|
|
|
|
LB_ENCAP_TYPE_GRE4,
|
|
|
|
|
LB_ENCAP_TYPE_GRE6,
|
|
|
|
|
LB_ENCAP_TYPE_L3DSR,
|
2018-02-06 23:00:22 +08:00
|
|
|
LB_ENCAP_TYPE_NAT4,
|
|
|
|
|
LB_ENCAP_TYPE_NAT6,
|
2018-01-23 19:17:23 +08:00
|
|
|
LB_ENCAP_N_TYPES,
|
|
|
|
|
} lb_encap_type_t;
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
/**
|
|
|
|
|
* Lookup type
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
LB_LKP_SAME_IP_PORT,
|
|
|
|
|
LB_LKP_DIFF_IP_PORT,
|
|
|
|
|
LB_LKP_ALL_PORT_IP,
|
|
|
|
|
LB_LKP_N_TYPES,
|
|
|
|
|
} lb_lkp_type_t;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* The load balancer supports IPv4 and IPv6 traffic
|
2018-02-06 23:00:22 +08:00
|
|
|
* and GRE4, GRE6, L3DSR and NAT4, NAT6 encap.
|
2016-08-04 16:13:09 +01:00
|
|
|
*/
|
|
|
|
|
typedef enum {
|
|
|
|
|
LB_VIP_TYPE_IP6_GRE6,
|
|
|
|
|
LB_VIP_TYPE_IP6_GRE4,
|
|
|
|
|
LB_VIP_TYPE_IP4_GRE6,
|
|
|
|
|
LB_VIP_TYPE_IP4_GRE4,
|
2018-01-23 19:17:23 +08:00
|
|
|
LB_VIP_TYPE_IP4_L3DSR,
|
2018-02-06 23:00:22 +08:00
|
|
|
LB_VIP_TYPE_IP4_NAT4,
|
|
|
|
|
LB_VIP_TYPE_IP6_NAT6,
|
2016-08-04 16:13:09 +01:00
|
|
|
LB_VIP_N_TYPES,
|
|
|
|
|
} lb_vip_type_t;
|
|
|
|
|
|
|
|
|
|
format_function_t format_lb_vip_type;
|
|
|
|
|
unformat_function_t unformat_lb_vip_type;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
|
|
|
|
|
/* args for different vip encap types */
|
|
|
|
|
typedef struct {
|
|
|
|
|
union
|
|
|
|
|
{
|
|
|
|
|
struct
|
|
|
|
|
{
|
|
|
|
|
/* Service type. clusterip or nodeport */
|
|
|
|
|
u8 srv_type;
|
|
|
|
|
|
|
|
|
|
/* Pod's port corresponding to specific service. network byte order */
|
|
|
|
|
u16 target_port;
|
|
|
|
|
};
|
|
|
|
|
/* DSCP bits for L3DSR */
|
|
|
|
|
u8 dscp;
|
|
|
|
|
u64 as_u64;
|
|
|
|
|
};
|
|
|
|
|
} lb_vip_encap_args_t;
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
typedef struct {
|
|
|
|
|
/* all fields in NET byte order */
|
|
|
|
|
union {
|
|
|
|
|
struct {
|
|
|
|
|
u32 vip_prefix_index;
|
|
|
|
|
u16 port;
|
|
|
|
|
u8 protocol;
|
|
|
|
|
u8 rsv;
|
|
|
|
|
};
|
|
|
|
|
u64 as_u64;
|
|
|
|
|
};
|
|
|
|
|
} vip_port_key_t;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
2018-06-28 20:14:19 +08:00
|
|
|
* Load balancing service is provided per VIP+protocol+port.
|
2016-08-04 16:13:09 +01:00
|
|
|
* In this data model, a VIP can be a whole prefix.
|
|
|
|
|
* But load balancing only
|
|
|
|
|
* occurs on a per-source-address/port basis. Meaning that if a given source
|
|
|
|
|
* reuses the same port for multiple destinations within the same VIP,
|
|
|
|
|
* they will be considered as a single flow.
|
|
|
|
|
*/
|
|
|
|
|
typedef struct {
|
|
|
|
|
|
|
|
|
|
//Runtime
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Vector mapping (flow-hash & new_connect_table_mask) to AS index.
|
|
|
|
|
* This is used for new flows.
|
|
|
|
|
*/
|
|
|
|
|
lb_new_flow_entry_t *new_flow_table;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* New flows table length - 1
|
|
|
|
|
* (length MUST be a power of 2)
|
|
|
|
|
*/
|
|
|
|
|
u32 new_flow_table_mask;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Last time garbage collection was run to free the ASs.
|
|
|
|
|
*/
|
|
|
|
|
u32 last_garbage_collection;
|
|
|
|
|
|
|
|
|
|
//Not runtime
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* A Virtual IP represents a given service delivered
|
|
|
|
|
* by a set of application servers. It can be a single
|
|
|
|
|
* address or a prefix.
|
|
|
|
|
* IPv4 prefixes are encoded using IPv4-in-IPv6 embedded address
|
|
|
|
|
* (i.e. ::/96 prefix).
|
|
|
|
|
*/
|
|
|
|
|
ip46_address_t prefix;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The VIP prefix length.
|
|
|
|
|
* In case of IPv4, plen = 96 + ip4_plen.
|
|
|
|
|
*/
|
|
|
|
|
u8 plen;
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
/* tcp or udp. If not per-port vip, set to ~0 */
|
|
|
|
|
u8 protocol;
|
|
|
|
|
|
|
|
|
|
/* tcp port or udp port. If not per-port vip, set to ~0 */
|
|
|
|
|
u16 port;
|
|
|
|
|
|
|
|
|
|
/* Valid for per-port vip */
|
|
|
|
|
u32 vip_prefix_index;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* The type of traffic for this.
|
|
|
|
|
* LB_TYPE_UNDEFINED if unknown.
|
|
|
|
|
*/
|
|
|
|
|
lb_vip_type_t type;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
/* args for different vip encap types */
|
|
|
|
|
lb_vip_encap_args_t encap_args;
|
2018-01-23 19:17:23 +08:00
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* Flags related to this VIP.
|
|
|
|
|
* LB_VIP_FLAGS_USED means the VIP is active.
|
|
|
|
|
* When it is not set, the VIP in the process of being removed.
|
|
|
|
|
* We cannot immediately remove a VIP because the VIP index still may be stored
|
|
|
|
|
* in the adjacency index.
|
|
|
|
|
*/
|
|
|
|
|
u8 flags;
|
2016-10-05 09:38:21 +01:00
|
|
|
#define LB_VIP_FLAGS_USED 0x1
|
2016-08-04 16:13:09 +01:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Pool of AS indexes used for this VIP.
|
|
|
|
|
* This also includes ASs that have been removed (but are still referenced).
|
|
|
|
|
*/
|
|
|
|
|
u32 *as_indexes;
|
|
|
|
|
} lb_vip_t;
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
#define lb_vip_is_ip4(type) (type == LB_VIP_TYPE_IP4_GRE6 \
|
|
|
|
|
|| type == LB_VIP_TYPE_IP4_GRE4 \
|
|
|
|
|
|| type == LB_VIP_TYPE_IP4_L3DSR \
|
|
|
|
|
|| type == LB_VIP_TYPE_IP4_NAT4 )
|
2018-02-06 23:00:22 +08:00
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
#define lb_vip_is_ip6(type) (type == LB_VIP_TYPE_IP6_GRE6 \
|
|
|
|
|
|| type == LB_VIP_TYPE_IP6_GRE4 \
|
|
|
|
|
|| type == LB_VIP_TYPE_IP6_NAT6 )
|
2018-02-06 23:00:22 +08:00
|
|
|
|
2018-01-23 19:17:23 +08:00
|
|
|
#define lb_encap_is_ip4(vip) ((vip)->type == LB_VIP_TYPE_IP6_GRE4 \
|
|
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_GRE4 \
|
2018-02-06 23:00:22 +08:00
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_L3DSR \
|
|
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_NAT4 )
|
2018-01-23 19:17:23 +08:00
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
#define lb_vip_is_gre4(vip) (((vip)->type == LB_VIP_TYPE_IP6_GRE4 \
|
|
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_GRE4) \
|
|
|
|
|
&& ((vip)->port == 0))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#define lb_vip_is_gre6(vip) (((vip)->type == LB_VIP_TYPE_IP6_GRE6 \
|
|
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_GRE6) \
|
|
|
|
|
&& ((vip)->port == 0))
|
|
|
|
|
|
|
|
|
|
#define lb_vip_is_gre4_port(vip) (((vip)->type == LB_VIP_TYPE_IP6_GRE4 \
|
|
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_GRE4) \
|
|
|
|
|
&& ((vip)->port != 0))
|
|
|
|
|
|
|
|
|
|
#define lb_vip_is_gre6_port(vip) (((vip)->type == LB_VIP_TYPE_IP6_GRE6 \
|
|
|
|
|
|| (vip)->type == LB_VIP_TYPE_IP4_GRE6) \
|
|
|
|
|
&& ((vip)->port != 0))
|
|
|
|
|
|
2018-06-11 11:40:17 -05:00
|
|
|
always_inline bool
|
|
|
|
|
lb_vip_is_l3dsr(const lb_vip_t *vip)
|
|
|
|
|
{
|
2018-06-28 20:14:19 +08:00
|
|
|
return (vip->type == LB_VIP_TYPE_IP4_L3DSR && vip->port ==0);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
always_inline bool
|
|
|
|
|
lb_vip_is_l3dsr_port(const lb_vip_t *vip)
|
|
|
|
|
{
|
|
|
|
|
return (vip->type == LB_VIP_TYPE_IP4_L3DSR && vip->port !=0);
|
2018-06-11 11:40:17 -05:00
|
|
|
}
|
|
|
|
|
always_inline bool
|
2018-06-28 20:14:19 +08:00
|
|
|
lb_vip_is_nat4_port(const lb_vip_t *vip)
|
2018-06-11 11:40:17 -05:00
|
|
|
{
|
2018-06-28 20:14:19 +08:00
|
|
|
return (vip->type == LB_VIP_TYPE_IP4_NAT4 && vip->port !=0);
|
2018-06-11 11:40:17 -05:00
|
|
|
}
|
|
|
|
|
always_inline bool
|
2018-06-28 20:14:19 +08:00
|
|
|
lb_vip_is_nat6_port(const lb_vip_t *vip)
|
2018-06-11 11:40:17 -05:00
|
|
|
{
|
2018-06-28 20:14:19 +08:00
|
|
|
return (vip->type == LB_VIP_TYPE_IP6_NAT6 && vip->port !=0);
|
2018-06-11 11:40:17 -05:00
|
|
|
}
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
format_function_t format_lb_vip;
|
|
|
|
|
format_function_t format_lb_vip_detailed;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
#define foreach_lb_nat_protocol \
|
|
|
|
|
_(UDP, 0, udp, "udp") \
|
|
|
|
|
_(TCP, 1, tcp, "tcp")
|
|
|
|
|
|
|
|
|
|
typedef enum {
|
|
|
|
|
#define _(N, i, n, s) LB_NAT_PROTOCOL_##N = i,
|
|
|
|
|
foreach_lb_nat_protocol
|
|
|
|
|
#undef _
|
|
|
|
|
} lb_nat_protocol_t;
|
|
|
|
|
|
|
|
|
|
always_inline u32
|
|
|
|
|
lb_ip_proto_to_nat_proto (u8 ip_proto)
|
|
|
|
|
{
|
|
|
|
|
u32 nat_proto = ~0;
|
|
|
|
|
|
|
|
|
|
nat_proto = (ip_proto == IP_PROTOCOL_UDP) ? LB_NAT_PROTOCOL_UDP : nat_proto;
|
|
|
|
|
nat_proto = (ip_proto == IP_PROTOCOL_TCP) ? LB_NAT_PROTOCOL_TCP : nat_proto;
|
|
|
|
|
|
|
|
|
|
return nat_proto;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Key for Pod's egress SNAT */
|
|
|
|
|
typedef struct {
|
|
|
|
|
union
|
|
|
|
|
{
|
|
|
|
|
struct
|
|
|
|
|
{
|
|
|
|
|
ip4_address_t addr;
|
|
|
|
|
u16 port;
|
|
|
|
|
u16 protocol:3,
|
|
|
|
|
fib_index:13;
|
|
|
|
|
};
|
|
|
|
|
u64 as_u64;
|
|
|
|
|
};
|
|
|
|
|
} lb_snat4_key_t;
|
|
|
|
|
|
|
|
|
|
typedef struct
|
|
|
|
|
{
|
|
|
|
|
union
|
|
|
|
|
{
|
|
|
|
|
struct
|
|
|
|
|
{
|
|
|
|
|
ip6_address_t addr;
|
|
|
|
|
u16 port;
|
|
|
|
|
u16 protocol;
|
|
|
|
|
u32 fib_index;
|
|
|
|
|
};
|
|
|
|
|
u64 as_u64[3];
|
|
|
|
|
};
|
|
|
|
|
} lb_snat6_key_t;
|
|
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
|
/**
|
|
|
|
|
* for vip + port case, src_ip = vip;
|
|
|
|
|
* for node ip + node_port, src_ip = node_ip
|
|
|
|
|
*/
|
|
|
|
|
ip46_address_t src_ip;
|
|
|
|
|
ip46_address_t as_ip;
|
|
|
|
|
u8 src_ip_is_ipv6;
|
|
|
|
|
u8 as_ip_is_ipv6;
|
|
|
|
|
/**
|
|
|
|
|
* Network byte order
|
|
|
|
|
* for vip + port case, src_port = port;
|
|
|
|
|
* for node ip + node_port, src_port = node_port
|
|
|
|
|
*/
|
|
|
|
|
u16 src_port;
|
|
|
|
|
u16 target_port; /* Network byte order */
|
|
|
|
|
u32 vrf_id;
|
|
|
|
|
u32 fib_index;
|
|
|
|
|
} lb_snat_mapping_t;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
typedef struct {
|
|
|
|
|
/**
|
|
|
|
|
* Each CPU has its own sticky flow hash table.
|
|
|
|
|
* One single table is used for all VIPs.
|
|
|
|
|
*/
|
|
|
|
|
lb_hash_t *sticky_ht;
|
|
|
|
|
} lb_per_cpu_t;
|
|
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
|
/**
|
|
|
|
|
* Pool of all Virtual IPs
|
|
|
|
|
*/
|
|
|
|
|
lb_vip_t *vips;
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
/**
|
|
|
|
|
* bitmap for vip prefix to support per-port vip
|
|
|
|
|
*/
|
|
|
|
|
uword *vip_prefix_indexes;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* Pool of ASs.
|
|
|
|
|
* ASs are referenced by address and vip index.
|
|
|
|
|
* The first element (index 0) is special and used only to fill
|
|
|
|
|
* new_flow_tables when no AS has been configured.
|
|
|
|
|
*/
|
|
|
|
|
lb_as_t *ass;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Each AS has an associated reference counter.
|
|
|
|
|
* As ass[0] has a special meaning, its associated counter
|
|
|
|
|
* starts at 0 and is decremented instead. i.e. do not use it.
|
|
|
|
|
*/
|
|
|
|
|
vlib_refcount_t as_refcount;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
/* hash lookup vip_index by key: {u16: nodeport} */
|
|
|
|
|
uword * vip_index_by_nodeport;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* Some global data is per-cpu
|
|
|
|
|
*/
|
|
|
|
|
lb_per_cpu_t *per_cpu;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Node next index for IP adjacencies, for each of the traffic types.
|
|
|
|
|
*/
|
|
|
|
|
u32 ip_lookup_next_index[LB_VIP_N_TYPES];
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Source address used in IPv6 encapsulated traffic
|
|
|
|
|
*/
|
|
|
|
|
ip6_address_t ip6_src_address;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Source address used for IPv4 encapsulated traffic
|
|
|
|
|
*/
|
|
|
|
|
ip4_address_t ip4_src_address;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Number of buckets in the per-cpu sticky hash table.
|
|
|
|
|
*/
|
|
|
|
|
u32 per_cpu_sticky_buckets;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Flow timeout in seconds.
|
|
|
|
|
*/
|
|
|
|
|
u32 flow_timeout;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Per VIP counter
|
|
|
|
|
*/
|
|
|
|
|
vlib_simple_counter_main_t vip_counters[LB_N_VIP_COUNTERS];
|
|
|
|
|
|
2016-10-05 09:38:21 +01:00
|
|
|
/**
|
|
|
|
|
* DPO used to send packet from IP4/6 lookup to LB node.
|
|
|
|
|
*/
|
|
|
|
|
dpo_type_t dpo_gre4_type;
|
|
|
|
|
dpo_type_t dpo_gre6_type;
|
2018-06-28 20:14:19 +08:00
|
|
|
dpo_type_t dpo_gre4_port_type;
|
|
|
|
|
dpo_type_t dpo_gre6_port_type;
|
2018-01-23 19:17:23 +08:00
|
|
|
dpo_type_t dpo_l3dsr_type;
|
2018-06-28 20:14:19 +08:00
|
|
|
dpo_type_t dpo_l3dsr_port_type;
|
|
|
|
|
dpo_type_t dpo_nat4_port_type;
|
|
|
|
|
dpo_type_t dpo_nat6_port_type;
|
2016-10-05 09:38:21 +01:00
|
|
|
/**
|
|
|
|
|
* Node type for registering to fib changes.
|
|
|
|
|
*/
|
|
|
|
|
fib_node_type_t fib_node_type;
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
/* lookup per_port vip by key */
|
|
|
|
|
clib_bihash_8_8_t vip_index_per_port;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
/* Find a static mapping by AS IP : target_port */
|
|
|
|
|
clib_bihash_8_8_t mapping_by_as4;
|
|
|
|
|
clib_bihash_24_8_t mapping_by_as6;
|
|
|
|
|
|
|
|
|
|
/* Static mapping pool */
|
|
|
|
|
lb_snat_mapping_t * snat_mappings;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
/**
|
|
|
|
|
* API dynamically registered base ID.
|
|
|
|
|
*/
|
|
|
|
|
u16 msg_id_base;
|
|
|
|
|
|
|
|
|
|
volatile u32 *writer_lock;
|
2018-02-06 23:00:22 +08:00
|
|
|
|
|
|
|
|
/* convenience */
|
|
|
|
|
vlib_main_t *vlib_main;
|
|
|
|
|
vnet_main_t *vnet_main;
|
2016-08-04 16:13:09 +01:00
|
|
|
} lb_main_t;
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
/* args for different vip encap types */
|
|
|
|
|
typedef struct {
|
|
|
|
|
ip46_address_t prefix;
|
|
|
|
|
u8 plen;
|
2018-06-28 20:14:19 +08:00
|
|
|
u8 protocol;
|
|
|
|
|
u16 port;
|
2018-02-06 23:00:22 +08:00
|
|
|
lb_vip_type_t type;
|
|
|
|
|
u32 new_length;
|
|
|
|
|
lb_vip_encap_args_t encap_args;
|
|
|
|
|
} lb_vip_add_args_t;
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
extern lb_main_t lb_main;
|
|
|
|
|
extern vlib_node_registration_t lb4_node;
|
2018-02-06 23:00:22 +08:00
|
|
|
extern vlib_node_registration_t lb6_node;
|
|
|
|
|
extern vlib_node_registration_t lb4_nodeport_node;
|
|
|
|
|
extern vlib_node_registration_t lb6_nodeport_node;
|
|
|
|
|
extern vlib_node_registration_t lb_nat4_in2out_node;
|
|
|
|
|
extern vlib_node_registration_t lb_nat6_in2out_node;
|
2016-08-04 16:13:09 +01:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Fix global load-balancer parameters.
|
|
|
|
|
* @param ip4_address IPv4 source address used for encapsulated traffic
|
|
|
|
|
* @param ip6_address IPv6 source address used for encapsulated traffic
|
|
|
|
|
* @return 0 on success. VNET_LB_ERR_XXX on error
|
|
|
|
|
*/
|
|
|
|
|
int lb_conf(ip4_address_t *ip4_address, ip6_address_t *ip6_address,
|
|
|
|
|
u32 sticky_buckets, u32 flow_timeout);
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
int lb_vip_add(lb_vip_add_args_t args, u32 *vip_index);
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
int lb_vip_del(u32 vip_index);
|
|
|
|
|
|
2018-06-28 20:14:19 +08:00
|
|
|
int lb_vip_find_index(ip46_address_t *prefix, u8 plen, u8 protocol,
|
|
|
|
|
u16 port, u32 *vip_index);
|
2016-08-04 16:13:09 +01:00
|
|
|
|
|
|
|
|
#define lb_vip_get_by_index(index) (pool_is_free_index(lb_main.vips, index)?NULL:pool_elt_at_index(lb_main.vips, index))
|
|
|
|
|
|
|
|
|
|
int lb_vip_add_ass(u32 vip_index, ip46_address_t *addresses, u32 n);
|
2018-08-22 20:21:19 +08:00
|
|
|
int lb_vip_del_ass(u32 vip_index, ip46_address_t *addresses, u32 n, u8 flush);
|
2018-09-18 23:25:02 +08:00
|
|
|
int lb_flush_vip_as (u32 vip_index, u32 as_index);
|
2016-08-04 16:13:09 +01:00
|
|
|
|
|
|
|
|
u32 lb_hash_time_now(vlib_main_t * vm);
|
|
|
|
|
|
|
|
|
|
void lb_garbage_collection();
|
|
|
|
|
|
2018-02-06 23:00:22 +08:00
|
|
|
int lb_nat4_interface_add_del (u32 sw_if_index, int is_del);
|
|
|
|
|
int lb_nat6_interface_add_del (u32 sw_if_index, int is_del);
|
|
|
|
|
|
2016-08-04 16:13:09 +01:00
|
|
|
format_function_t format_lb_main;
|
|
|
|
|
|
|
|
|
|
#endif /* LB_PLUGIN_LB_LB_H_ */
|