bridget/bridget.sh

323 lines
9.3 KiB
Bash

#!/bin/sh
CNI_CONFIG="${CNI_CONFIG:-/etc/cni/net.d/10-bridget.conf}"
usage() {
cat <<EOF
Available variables:
- BRIDGE (example: cbr0)
- VLAN (example: 100)
- IFACE (example: eth0)
- MTU (default: 1500)
- CHECK_SLAVES (example: 1)
- POD_NETWORK (default: 10.244.0.0/16)
- DIVISION_PREFIX (default: 24)"
- ARP_PACKETS (default: 4)
- DEBUG (example: 1)
Short workflow:
* If bridge exists it will be used, if not exist it will be created
* If VLAN and IFACE is set, the next chain will be created:
IFACE <-- VLAN <-- BRIDGE
* If bridge have no IP-address it will be retrived automatically
This IP-address will be used as default gateway for containers
for make possible kubernetes-services.
EOF
}
error() {
>&2 echo -en "[$(date '+%Y-%m-%d %H:%M:%S')] ERROR:\t"
>&2 echo "$1"
>&2 usage
exit 1
}
log() {
echo -en "[$(date '+%Y-%m-%d %H:%M:%S')] INFO:\t"
echo "$1"
}
debug() {
if [ "$DEBUG" == 1 ]; then
>&2 echo -en "[$(date '+%Y-%m-%d %H:%M:%S')] DEBUG:\t"
>&2 echo "$1"
fi
}
next_ip() {
local IP_HEX=$(printf '%.2X%.2X%.2X%.2X\n' `echo $1 | sed -e 's/\./ /g'`)
local NEXT_IP_HEX=$(printf %.8X `echo $(( 0x$IP_HEX + 1 ))`)
local NEXT_IP=$(printf '%d.%d.%d.%d\n' `echo $NEXT_IP_HEX | sed -r 's/(..)/0x\1 /g'`)
echo $NEXT_IP
}
prev_ip() {
local IP_HEX=$(printf '%.2X%.2X%.2X%.2X\n' `echo $1 | sed -e 's/\./ /g'`)
local PREV_IP_HEX=$(printf %.8X `echo $(( 0x$IP_HEX - 1 ))`)
local PREV_IP=$(printf '%d.%d.%d.%d\n' `echo $PREV_IP_HEX | sed -r 's/(..)/0x\1 /g'`)
echo $PREV_IP
}
random_gateway() {
local IFS=
local NETWORKS_NUM="$(echo "$NETWORKS_LIST" | wc -l)"
local RANDOM_NETWORK_NUM="$(shuf -i "1-$NETWORKS_NUM" -n 1)"
local RANDOM_NETWORK="$(echo "$NETWORKS_LIST" | head -n "$RANDOM_NETWORK_NUM" | tail -n 1)"
unset IFS
local RANDOM_GATEWAY="$(next_ip $RANDOM_NETWORK)"
echo "$RANDOM_GATEWAY"
}
address_is_free(){
set +m
ARP_PACKETS=${ARP_PACKETS:-4}
# Start recording packets
tcpdump -nn -i "$BRIDGE" arp host "$1" 1>/dev/null 2>/tmp/tcpdump.out &
# Wait for tcpdump
until [ -f /tmp/tcpdump.out ]; do sleep 0.1; done
# Start arping
local ARPING_CHECK="$(arping -fD -I "$BRIDGE" -s 0.0.0.0 -c 4 "$1" | awk '$1=="Sent" {printf $2 " "} $1=="Received" {print $2}')"
# Kill tcpdump
kill "$!" && wait "$!"
local TCPDUMP_COUNT="$(awk '$3 == "received" {print $1}' /tmp/tcpdump.out)"
local ARPING_COUNT="$(echo "$ARPING_CHECK" | awk '{print $1+$2}')"
local ARPING_SEND="$(echo "$ARPING_CHECK" | awk '{print $1}')"
local ARPING_RECEIVED="$(echo "$ARPING_CHECK" | awk '{print $2}')"
debug "TCPDUMP_COUNT=$TCPDUMP_COUNT"
debug "ARPING_COUNT=$ARPING_COUNT"
debug "ARPING_SEND=$ARPING_SEND"
debug "ARPING_RECEIVED=$ARPING_RECEIVED"
debug "$(cat /tmp/tcpdump.out)"
rm -f /tmp/tcpdump.out
if [ "$ARPING_RECEIVED" == "0" ] && [ "$TCPDUMP_COUNT" == "$ARPING_COUNT" ]; then
debug "[ ARPING_RECEIVED == 0 ] && [ TCPDUMP_COUNT == ARPING_COUNT ]"
return 0
else
debug "[ ARPING_RECEIVED != 0 ] && [ TCPDUMP_COUNT != ARPING_COUNT ]"
return 1
fi
}
gateway_is_right() {
(IFS= echo "$NETWORKS_LIST") | grep -q "$(prev_ip $1)"
}
# ------------------------------------------------------------------------------------
# Configure bridge
# ------------------------------------------------------------------------------------
log "Starting bridge configuration"
[ -z "$BRIDGE" ] && error "BRIDGE variable is not defined"
# Check if bridge interface exist
if ! ip link show "$BRIDGE" &> /dev/null; then
log "Adding new bridge $BRIDGE"
ip link add dev "$BRIDGE" type bridge
export CHECK_SLAVES=1
else
log "Bridge $BRIDGE already exist, use it"
fi
log "Setting bridge $BRIDGE up"
ip link set "$BRIDGE" up
# ------------------------------------------------------------------------------------
# Configure vlan
# ------------------------------------------------------------------------------------
if ([ ! -z "$VLAN" ] || [ ! -z "$IFACE" ]) && [ "$CHECK_SLAVES" == 1 ]; then
log "Starting VLAN configuration"
[ -z "$IFACE" ] && error "IFACE variable is not defined"
if [ ! -z "$VLAN" ]; then
# check if vlan interface exist
if ip link show "$IFACE.$VLAN" &> /dev/null; then
log "VLAN interface $IFACE.$VLAN already exist"
else
log "Adding new VLAN interface $IFACE.$VLAN"
ip link add link "$IFACE" name "$IFACE.$VLAN" type vlan id "$VLAN"
fi
log "Setting vlan $IFACE.$VLAN up"
ip link set dev "$IFACE.$VLAN" up
fi
fi
# ------------------------------------------------------------------------------------
# Configure slaves
# ------------------------------------------------------------------------------------
if ([ ! -z "$VLAN" ] || [ ! -z "$IFACE" ]) && [ "$CHECK_SLAVES" == 1 ]; then
log "Starting configuring slave interfaces"
if [ ! -z "$VLAN" ]; then
SLAVEIF="$IFACE.$VLAN"
else
SLAVEIF="$IFACE"
fi
if ! ip link show "$SLAVEIF" &> /dev/null; then
error "$SLAVEIF does not exist"
fi
# check if slave interface contains right master
MASTERIF="$(ip -o link show "$SLAVEIF" | grep -o -m1 'master [^ ]\+' | cut -d' ' -f2 )"
case "$MASTERIF" in
"$BRIDGE" ) log "$SLAVEIF already member of $BRIDGE" ;;
"" ) log "Adding $SLAVEIF as member to $BRIDGE"
ip link set "$SLAVEIF" master "$BRIDGE" ;;
* ) error "interface $SLAVEIF have another master" ;;
esac
fi
# ------------------------------------------------------------------------------------
# Retrive network parameters
# ------------------------------------------------------------------------------------
log "Starting retriving parameters"
POD_NETWORK="${POD_NETWORK:-10.244.0.0/16}"
DIVISION_PREFIX="${DIVISION_PREFIX:-24}"
log "POD_NETWORK=$POD_NETWORK"
log "DIVISION_PREFIX=$DIVISION_PREFIX"
set -e
export "POD_$(ipcalc -p "$POD_NETWORK")" # POD_PREFIX
export "POD_$(ipcalc -b "$POD_NETWORK")" # POD_BROADCAST
export "POD_$(ipcalc -n "$POD_NETWORK")" # POD_NETWORK
export "FIRST_$(ipcalc -n "$POD_NETWORK/$DIVISION_PREFIX" )" # FIRST_NETWORK
export "LAST_$(ipcalc -n "$POD_BROADCAST/$DIVISION_PREFIX" )" # LAST_NETWORK
set +e
debug "POD_PREFIX=$POD_PREFIX"
debug "POD_BROADCAST=$POD_BROADCAST"
debug "POD_NETWORK=$POD_NETWORK"
debug "FIRST_NETWORK=$FIRST_NETWORK"
debug "LAST_NETWORK=$LAST_NETWORK"
NETWORKS_LIST="$(
CUR_NETWORK="$LAST_NETWORK"
until [ "$CUR_NETWORK" == "$FIRST_NETWORK" ]; do
echo "$CUR_NETWORK"
export CUR_"$(ipcalc -n "$(prev_ip "$CUR_NETWORK")/$DIVISION_PREFIX")"
done
)"
debug "NETWORKS_LIST=\"$(echo "$NETWORKS_LIST" | tr '\n' ' ' )\""
# ------------------------------------------------------------------------------------
# Configure IP-address
# ------------------------------------------------------------------------------------
log "Starting configuring IP-address"
# Check ip address
IPADDR="$(ip -f inet -o addr show "$BRIDGE" | grep -o -m1 'inet [^ /]*' | cut -d' ' -f2)"
# If ip not exist
if [ -z "$IPADDR" ]; then
if [ -f "$CNI_CONFIG" ]; then
CHECKING_IP=$(sed -n 's/.*"gateway": "\(.*\)",/\1/p' "$CNI_CONFIG")
log "Cni config found, taking old address $CHECKING_IP"
rm -f "$CNI_CONFIG"
fi
if [ -z $CHECKING_IP ] || ! gateway_is_right "$CHECKING_IP"; then
CHECKING_IP="$(random_gateway)"
log "New address generated $CHECKING_IP"
fi
log "Checking $CHECKING_IP"
while ! address_is_free "$CHECKING_IP"; do
log "Address $CHECKING_IP is not free"
CHECKING_IP="$(random_gateway)"
log "Taking another one $CHECKING_IP"
done
log "Address $CHECKING_IP is free, using it as gateway"
IPADDR="$CHECKING_IP"
log "Configuring $IPADDR/$POD_PREFIX on $BRIDGE"
ip addr change "$IPADDR/$POD_PREFIX" dev "$BRIDGE"
else
if ! gateway_is_right "$IPADDR"; then
error "$BRIDGE already have IP address not from the list"
fi
log "IP-address $IPADDR already set, use it"
fi
# ------------------------------------------------------------------------------------
# Configure cni
# ------------------------------------------------------------------------------------
log "Starting generating CNI configuration"
set -e
GATEWAY="$IPADDR"
SUBNET="${POD_NETWORK}/${POD_PREFIX}"
FIRST_IP="$(next_ip "${GATEWAY}")"
LAST_IP="$(prev_ip "$(ipcalc -b "${GATEWAY}/${DIVISION_PREFIX}" | cut -d= -f2)")"
set +e
debug "GATEWAY=$GATEWAY"
debug "SUBNET=$SUBNET"
debug "FIRST_IP=$FIRST_IP"
debug "LAST_IP=$LAST_IP"
log "Writing $CNI_CONFIG"
cat > $CNI_CONFIG <<EOT
{
"name": "bridget",
"type": "bridge",
"bridge": "${BRIDGE}",
"ipMasq": true,
"mtu": ${MTU:-1500},
"ipam": {
"type": "host-local",
"subnet": "${SUBNET}",
"rangeStart": "${FIRST_IP}",
"rangeEnd": "${LAST_IP}",
"gateway": "${GATEWAY}",
"routes": [
{ "dst": "0.0.0.0/0" }
]
}
}
EOT
debug "$(cat "$CNI_CONFIG")"
# ------------------------------------------------------------------------------------
# Sleep gently
# ------------------------------------------------------------------------------------
exec tail -f /dev/null