networking services restart hangs due to missing /etc/network/run/ifenslave.* files
| Affects | Status | Importance | Assigned to | Milestone |
|---|---|---|---|---|
| ifenslave (Ubuntu) | Confirmed | Undecided | Unassigned | |
Bug Description
Ubuntu 12.04 LTS
ifenslave-2.6
ifup hangs when bonds are configured and networking is restarted via '/etc/init.
##/etc/
#!/bin/sh
[ "$VERBOSITY" = 1 ] && set -x
IFSTATE=
add_master()
{
# Return if $BOND_MASTER is already a bonding interface.
[ -f "/sys/class/
# If the bonding module is not yet loaded, load it.
if [ ! -r /sys/class/
modprobe -q bonding
FAILED=1
echo "Waiting for bonding kernel module to be ready (will timeout after 5s)"
for i in $(seq 50); do
if [ -r /sys/class/
FAILED=0
break
fi
sleep 0.1
done
if [ "$FAILED" = "1" ]; then
echo "/sys/class/
exit 1
fi
fi
# Create the master interface.
if ! grep -sq "\\<$BOND_
echo "+$BOND_MASTER" > /sys/class/
fi
}
sysfs_change_down()
{
# Called with :
# $1 = basename of the file in bonding/ to write to.
# $2 = value to write. Won't write if $2 is empty.
if [ "$2" ] ; then
# If the value we plan to write is different from the current one...
if ! grep -sq "\\<$2\\>" "/sys/class/
# ...and the master is up...
if ip link show "$BOND_MASTER" | grep -sq '[<,]UP[,>]' ; then
# ...bring the master down.
ip link set dev "$BOND_MASTER" down
fi
fi
sysfs "$1" "$2"
fi
}
sysfs()
{
# Called with :
# $1 = basename of the file in bonding/ to write to.
# $2 = value to write. Won't write if $2 is empty.
if [ "$2" ] ; then
echo "$2" > "/sys/class/
return $?
fi
return 0
}
sysfs_add()
{
# Called with :
# $1 = target filename.
# $2 = values to write.
for value in $2; do
# Do not add $2 to $1 if already present.
if ! grep -sq "\\<$value\\>" /sys/class/
then
sysfs "$1" "+$value"
fi
done
}
# early_setup_master is the place where we do master setup that need to be done before enslavement.
early_setup_
{
# Warning: the order in wich we write into the sysfs files is important.
# Double check in drivers/
# before changing anything here.
# fail_over_mac must be set before enslavement of any slaves.
sysfs fail_over_mac "$IF_BOND_
}
# late_setup_master runs actions that need to happen after enslavement
late_setup_master()
{
# primary must be set after mode (because only supported in some modes) and after enslavement.
# The first slave in bond-primary found in current slaves becomes the primary.
# If no slave in bond-primary is found, then primary does not change.
for slave in $IF_BOND_PRIMARY ; do
if grep -sq "\\<$slave\\>" "/sys/class/
sysfs primary "$slave"
break
fi
done
# primary_reselect should be set after mode (because only supported in some modes), after enslavement
# and after primary. This is currently (2.6.35-rc1) not enforced by the bonding driver, but it is
# probably safer to do it in that order.
sysfs primary_reselect "$IF_BOND_
# queue_id must be set after enslavement.
for iface_queue_id in $IF_BOND_QUEUE_ID
do
sysfs iface_queue_id $iface_queue_id
done
# active_slave must be set after mode and after enslavement.
# The slave must be up and the underlying link must be up too.
# FIXME: We should have a way to write an empty string to active_slave, to set the active_slave to none.
if [ "$IF_BOND_
# Need to force interface up before. Bonding will refuse to activate a down interface.
ip link set "$IF_BOND_
sysfs active_slave "$IF_BOND_
fi
}
enslave_slaves()
{
case "$BOND_SLAVES" in
none)
BOND_SLAVES=""
;;
all)
BOND_SLAVES=`sed -ne 's/ *\(eth[
AUTOIF="yes"
;;
esac
[ "$VERBOSITY" = 1 ] && v=-v
for slave in $BOND_SLAVES ; do
if ( [ "$AUTOIF" ] && grep -q "^$slave=" $IFSTATE ) ; then
echo "Not enslaving interface $slave since it is already configured"
else
# Ensure $slave is down.
ip link set "$slave" down 2>/dev/null
if ! sysfs_add slaves "$slave" 2>/dev/null ; then
echo "Failed to enslave $slave to $BOND_MASTER. Is $BOND_MASTER ready and a bonding interface ?" >&2
else
# Bring up slave if it is the target of an allow-bondX stanza.
# This is usefull to bring up slaves that need extra setup.
if [ -z "$(which ifquery)" ] || ifquery --allow \"$BOND_MASTER\" --list | grep -q $slave; then
ifup $v --allow "$BOND_MASTER" "$slave"
fi
fi
fi
done
}
setup_master()
{
# Warning: the order in wich we write into the sysfs files is important.
# Double check in drivers/
# before changing anything here.
# use_carrier can be set anytime.
sysfs use_carrier "$IF_BOND_
# num_grat_arp can be set anytime.
sysfs num_grat_arp "$IF_BOND_
# num_unsol_na can be set anytime.
sysfs num_unsol_na "$IF_BOND_
# xmit_hash_policy can be set anytime.
# Changing xmit_hash_policy requires $BOND_MASTER to be down.
sysfs_change_down xmit_hash_policy "$IF_BOND_
# arp_ip_target must be set before arp_interval.
sysfs_add arp_ip_target "$IF_BOND_
sysfs arp_interval "$IF_BOND_
# miimon must be set before updelay and downdelay.
sysfs miimon "$IF_BOND_MIIMON"
sysfs downdelay "$IF_BOND_
sysfs updelay "$IF_BOND_UPDELAY"
# Changing ad_select requires $BOND_MASTER to be down.
sysfs_change_down ad_select "$IF_BOND_
# Changing mode requires $BOND_MASTER to be down.
# Mode should be set after miimon or arp_interval, to avoid a warning in syslog.
sysfs_change_down mode "$IF_BOND_MODE"
# arp_validate must be after mode (because mode must be active-backup).
sysfs arp_validate "$IF_BOND_
# lacp_rate must be set after mode (because mode must be 802.3ad).
# Changing lacp_rate requires $BOND_MASTER to be down.
sysfs_change_down lacp_rate "$IF_BOND_
# Finally bring the bond up, note that without a slave it won't be usable though
ip link set dev $BOND_MASTER up
}
# Option slaves deprecated, replaced by bond-slaves, but still supported for backward compatibility.
IF_BOND_
if [ "$IF_BOND_MASTER" ] ; then
BOND_MASTER=
BOND_SLAVES=
else
if [ "$IF_BOND_SLAVES" ] ; then
BOND_
BOND_
fi
fi
# Exit if nothing to do...
[ -z "$BOND_
# Always try to create the master, returns if already exists
add_master
if [ "$BOND_MASTER" = "$IFACE" ]; then
# Setup the master interface
early_setup_master
setup_master
# Indicate that we're done setting up the master
# this is required as ifstate is modified at the beginning
# of the interface setup, not at the end
touch /run/network/
# Wait for a slave to join, continuing without a slave
# would make dhclient, vconfig or brctl fail, so better wait
# Timeout after a minute
FAILED=1
echo "Waiting for a slave to join $BOND_MASTER (will timeout after 60s)"
for i in $(seq 600); do
if [ -n "$(cat /sys/class/
FAILED=0
break
fi
sleep 0.1
done
if [ "$FAILED" = "1" ]; then
echo "No slave joined $BOND_MASTER, continuing anyway"
else
# Trigger the udev bridging hook to bridge the bond if needed
if [ -x /lib/udev/
INTERFACE=
fi
# Trigger the udev bridging hook to tag the bond if needed
if [ -x /lib/udev/
INTERFACE=
fi
fi
else
# Wait for the master to be ready
[ ! -f /run/network/
while :; do
if [ -f /run/network/
break
fi
sleep 0.1
done
# Only setup one slave at once
BOND_SLAVES=$IFACE enslave_slaves
# Call late_setup_master every time we add a slave as we don't have a way to know
# when all the slaves are up
BOND_SLAVES=$IFACE late_setup_master
fi
exit 0
## /etc/network/
# This file describes the network interfaces available on your system
# and how they will be activated. For more information, see interfaces(5).
# chef managed!
auto eth1
iface eth1 inet manual
bond-master bond0
bond-primary eth1
# default bridge interface
auto backend
iface backend inet manual
bridge_fd 0
bridge_ports vlan10
bridge_stp off
# failover nic team
auto bond0
iface bond0 inet manual
bond-miimon 100
bond-mode active-backup
bond-primary eth1
bond-slaves none
# The VM network interface
auto eth0
iface eth0 inet static
address 10.0.2.15
broadcast 10.0.2.255
gateway 10.0.2.0
netmask 255.255.255.0
# The loopback interface
auto lo
iface lo inet loopback
# default vlan interface
auto vlan10
iface vlan10 inet manual
vlan_raw_device bond0
ProblemType: Bug
DistroRelease: Ubuntu 12.04
Package: ifenslave-2.6 1.1.0-19ubuntu5
ProcVersionSign
Uname: Linux 3.2.0-32-generic x86_64
ApportVersion: 2.0.1-0ubuntu17.1
Architecture: amd64
Date: Thu Jan 16 17:34:48 2014
InstallationMedia: Ubuntu-Server 12.04.1 LTS "Precise Pangolin" - Release amd64 (20120817.3)
MarkForUpload: True
ProcEnviron:
TERM=xterm
PATH=(custom, no user)
LANG=en_US.UTF-8
SHELL=/bin/bash
SourcePackage: ifenslave-2.6
UpgradeStatus: No upgrade log present (probably fresh install)
| Keegan Holley (keeganh) wrote : | #1 |
| Keegan Holley (keeganh) wrote : | #2 |
| affects: | ifenslave-2.6 (Ubuntu) → ifenslave (Ubuntu) |
| Stéphane Graber (stgraber) wrote : | #3 |
/etc/init.
Rather than copy/paste half the code of ifenslave, could you instead post your current /etc/network/
As a reminder, ifupdown is entirely sequential; the interfaces therefore need to be listed roughly in this order:
- loopback
- primary physical interface (bond member)
- any other physical interface (bond member)
- bond interface
- any virtual interface (vlan, bridge, ...) based on top of the bond
If the interfaces aren't listed in precisely that order, "ifup -a" will hang (though the boot itself won't as it's using events to bring up individual interfaces rather than using ifup -a).
| Changed in ifenslave (Ubuntu): | |
| status: | New → Incomplete |
| Launchpad Janitor (janitor) wrote : | #4 |
[Expired for ifenslave (Ubuntu) because there has been no activity for 60 days.]
| Changed in ifenslave (Ubuntu): | |
| status: | Incomplete → Expired |
| Stefan Andres (s-andres) wrote : | #5 |
I have the same problem. I've a box with 4 NICs.
2x1 GigE Intel cards (eth1, eth3)
2x10 GigE Broadcom cards (eth0, eth2)
I'm booting up with the first Intel card, which gets a DHCP IP; that works fine:
https:/
Then I swap that interfaces file (in the end by puppet, but now manually for debugging):
https:/
Then I do ifdown -a which brings all interfaces down and then do a ifup -a -v and then ifup -a hangs forever in the [ -f /run/network/
https:/
| Changed in ifenslave (Ubuntu): | |
| status: | Expired → New |
| Launchpad Janitor (janitor) wrote : | #6 |
Status changed to 'Confirmed' because the bug affects multiple users.
| Changed in ifenslave (Ubuntu): | |
| status: | New → Confirmed |
| Johannes Grassler (jgr-launchpad) wrote : | #7 |
We now fixed this locally by hacking up a less flexible but working alternative to ifenslave:
| Cory Wright (corywright) wrote : | #8 |
This bug is also affecting our 12.04 LTS systems. It seems to have something to do with whether or not the bonding module is already loaded.
| Sven Hoexter (sven-timegate) wrote : | #9 |
Instead of replacing the whole (broken) ifenslave script, it seems to work to just bring up the bond yourself via pre-up.
It's ugly and works somewhat against upstart, but it works for the moment[tm] and you can stick to your own habits of using ifup/ifdown. :(
auto eth1 eth2 bond0
iface eth1 inet manual
bond-master bond0
iface eth2 inet manual
bond-master bond0
iface bond0 inet static
address 192.168.1.1
netmask 255.255.255.0
bond-primary eth1
bond-slaves eth1 eth2
pre-up echo +bond0 > /sys/class/
pre-up ifenslave bond0 eth1 eth2
| Sven Hoexter (sven-timegate) wrote : | #10 |
small but important mistake in the bond0 stanza:
- pre-up echo +bond0 > /sys/class/
+ pre-up echo +bond0 > /sys/class/
| Andrew McDermott (frobware) wrote : | #11 |
I was trying to do something very similar for Juju - when the machine boots we rewrite /etc/network/
Our sequence is:
$ ifdown -a
$ transform --in-place /etc/network/
$ ifup -a
and with bonds configured using 802.3ad this would always hang on the ifup stage.
If I add a:
$ sleep 0.5
after the transform stage then the sequence of ifdown/up seems to work very reliably.
| Andrew McDermott (frobware) wrote : | #12 |
To clarify, my "transform" script just bridges active interfaces.
| Cory Wright (corywright) wrote : | #13 |
This bug has persisted through three LTS releases (12.04, 14.04, 16.04) and has bitten me on each one.
Are there plans to fix this?


The root cause is in /etc/network/if-pre-up.d/ifenslave, starting at line 260.
If the /run/network/ifenslave.<BOND> file doesn't exist, ifup goes into an unterminated while loop, since nothing inside the loop will create the file.
[ ! -f /run/network/ifenslave.$BOND_MASTER ] && echo "Waiting for bond master $BOND_MASTER to be ready"
while :; do
if [ -f /run/network/ifenslave.$BOND_MASTER ]; then
break
fi
sleep 0.1
done